{"url":"http://public2.vulnerablecode.io/api/vulnerabilities/37334?format=json","vulnerability_id":"VCID-jzjy-kj6h-4bas","summary":"vLLM is an inference and serving engine for large language models (LLMs). From 0.18.0 to before 0.20.0, the extract_hidden_states speculative decoding proposer in vLLM returns a tensor with an incorrect shape after the first decode step, causing a RuntimeError that crashes the EngineCore process. The crash is triggered when any request in the batch uses sampling penalty parameters (repetition_penalty, frequency_penalty, or presence_penalty). A single request with a penalty parameter (e.g., \"repetition_penalty\": 1.1) is sufficient to crash the server. This vulnerability is fixed in 0.20.0.","aliases":[{"alias":"CVE-2026-44223"},{"alias":"GHSA-83vm-p52w-f9pw"},{"alias":"PYSEC-2026-145"}],"fixed_packages":[{"url":"http://public2.vulnerablecode.io/api/packages/50315?format=json","purl":"pkg:pypi/vllm@0.20.0","is_vulnerable":false,"affected_by_vulnerabilities":[],"resource_url":"http://public2.vulnerablecode.io/packages/pkg:pypi/vllm@0.20.0"}],"affected_packages":[{"url":"http://public2.vulnerablecode.io/api/packages/49118?format=json","purl":"pkg:pypi/vllm@0.18.0","is_vulnerable":true,"affected_by_vulnerabilities":[{"vulnerability":"VCID-jzjy-kj6h-4bas"},{"vulnerability":"VCID-za3a-c9m1-jqgz"}],"resource_url":"http://public2.vulnerablecode.io/packages/pkg:pypi/vllm@0.18.0"},{"url":"http://public2.vulnerablecode.io/api/packages/49119?format=json","purl":"pkg:pypi/vllm@0.18.1","is_vulnerable":true,"affected_by_vulnerabilities":[{"vulnerability":"VCID-jzjy-kj6h-4bas"},{"vulnerability":"VCID-za3a-c9m1-jqgz"}],"resource_url":"http://public2.vulnerablecode.io/packages/pkg:pypi/vllm@0.18.1"},{"url":"http://public2.vulnerablecode.io/api/packages/49120?format=json","purl":"pkg:pypi/vllm@0.19.0","is_vulnerable":true,"affected_by_vulnerabilities":[{"vulnerability":"VCID-jzjy-kj6h-4bas"}],"resource_url":"http://public2.vulnerablecode.io/packages/pkg:pypi/v
llm@0.19.0"},{"url":"http://public2.vulnerablecode.io/api/packages/50314?format=json","purl":"pkg:pypi/vllm@0.19.1","is_vulnerable":true,"affected_by_vulnerabilities":[{"vulnerability":"VCID-jzjy-kj6h-4bas"}],"resource_url":"http://public2.vulnerablecode.io/packages/pkg:pypi/vllm@0.19.1"}],"references":[{"reference_url":"https://github.com/vllm-project/vllm","reference_id":"","reference_type":"","scores":[{"value":"6.5","scoring_system":"cvssv3.1","scoring_elements":"CVSS:3.1/AV:N/AC:L/PR:L/UI:N/S:U/C:N/I:N/A:H"},{"value":"MODERATE","scoring_system":"generic_textual","scoring_elements":""}],"url":"https://github.com/vllm-project/vllm"},{"reference_url":"https://github.com/vllm-project/vllm/pull/38610","reference_id":"","reference_type":"","scores":[{"value":"6.5","scoring_system":"cvssv3.1","scoring_elements":"CVSS:3.1/AV:N/AC:L/PR:L/UI:N/S:U/C:N/I:N/A:H"},{"value":"MODERATE","scoring_system":"generic_textual","scoring_elements":""}],"url":"https://github.com/vllm-project/vllm/pull/38610"},{"reference_url":"https://github.com/vllm-project/vllm/security/advisories/GHSA-83vm-p52w-f9pw","reference_id":"","reference_type":"","scores":[{"value":"6.5","scoring_system":"cvssv3.1","scoring_elements":"CVSS:3.1/AV:N/AC:L/PR:L/UI:N/S:U/C:N/I:N/A:H"},{"value":"MODERATE","scoring_system":"generic_textual","scoring_elements":""}],"url":"https://github.com/vllm-project/vllm/security/advisories/GHSA-83vm-p52w-f9pw"},{"reference_url":"https://nvd.nist.gov/vuln/detail/CVE-2026-44223","reference_id":"","reference_type":"","scores":[{"value":"6.5","scoring_system":"cvssv3.1","scoring_elements":"CVSS:3.1/AV:N/AC:L/PR:L/UI:N/S:U/C:N/I:N/A:H"},{"value":"MODERATE","scoring_system":"generic_textual","scoring_elements":""}],"url":"https://nvd.nist.gov/vuln/detail/CVE-2026-44223"}],"weaknesses":[{"cwe_id":131,"name":"Incorrect Calculation of Buffer Size","description":"The product does not correctly calculate the size to be used when allocating a buffer, which could lead to a buffer 
overflow."},{"cwe_id":704,"name":"Incorrect Type Conversion or Cast","description":"The product does not correctly convert an object, resource, or structure from one type to a different type."}],"exploits":[],"severity_range_score":"4.0 - 6.9","exploitability":null,"weighted_severity":null,"risk_score":null,"resource_url":"http://public2.vulnerablecode.io/vulnerabilities/VCID-jzjy-kj6h-4bas"}