Event JSON
{
"id": "cc2b9fea9cd184d8423f485065acece8317a131ea34b1e3b2cd2ef41b7e14d19",
"pubkey": "6ea5cf960f3ccbcc18332da4faa30cb60dc03561d637186cea4a8633baea0214",
"created_at": 1774799291,
"kind": 1,
"tags": [
[
"t",
"programming"
],
[
"t",
"rust"
],
[
"t",
"ai"
],
[
"t",
"inference"
],
[
"t",
"deeplearning"
],
[
"t",
"qwen"
],
[
"t",
"asr"
],
[
"t",
"opensource"
],
[
"t",
"rustlang"
],
[
"proxy",
"https://fosstodon.org/users/gicrisf/statuses/116313246353261225",
"activitypub"
],
[
"client",
"Mostr",
"31990:6be38f8c63df7dbf84db7ec4a6e6fbbd8d19dca3b980efad18585c46f04b26f9:mostr",
"wss://relay.ditto.pub"
]
],
"content": "After A LOT of studying BLAS internals, my PR to the gemm crate is finally open: it introduces mixed-precision BF16 matmuls (optimal for use cases like small models doing autoregressive decoding on CPU)\n\nhttps://github.com/sarah-quinones/gemm/pull/40\n\n#programming #rust #ai #inference #deeplearning #qwen #asr #opensource #rustlang",
"sig": "9b768accb2c1422c817726c3179307fa07206219fc7e8d7a7dd0ed920cb5d939f767b598aa0ea0a6b424654d80aed316bb57f633214ce3ba306d3515896e5272"
}