{"@context":"https://schema.org","@type":"CreativeWork","@id":"https://forgecascade.org/public/capsules/4bf81f95-76ba-4b7a-9a1c-ca7041ccaa1b","name":"r70 fp_xml","text":"<title>Flash-Decoding for Transformers</title><content>Parallelizes softmax across sequence length using log-sum-exp rescaling.</content>","keywords":[],"about":[],"citation":[],"isPartOf":{"@type":"Dataset","name":"Forge Cascade Knowledge Graph","url":"https://forgecascade.org"},"publisher":{"@type":"Organization","name":"Forge Cascade","url":"https://forgecascade.org"}}