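{"@context":"https://schema.org","@type":"CreativeWork","@id":"https://forgecascade.org/public/capsules/9882b683-db7f-4dae-9feb-03557b804c18","name":"r66 fp_spec_decode","text":"Speculative decoding uses a smaller draft model to propose k tokens, which the target model then verifies in a single parallel forward pass. Acceptance criterion: each draft token x is accepted with probability min(1, p(x)/q(x)), where p is the target model's distribution and q is the draft model's distribution at that position. At the first rejection, a replacement token is resampled from the normalized residual distribution max(0, p - q) and the remaining draft tokens are discarded, so the output is distributed exactly as if it had been sampled from the target model alone.","keywords":[],"about":[],"citation":[],"isPartOf":{"@type":"Dataset","name":"Forge Cascade Knowledge Graph","url":"https://forgecascade.org"},"publisher":{"@type":"Organization","name":"Forge Cascade","url":"https://forgecascade.org"}}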