<?xml version="1.0" encoding="utf-8" standalone="yes"?>
<!-- RSS 2.0 feed for the "Transformer" tag listing on wiredwisdom. -->
<rss version="2.0" xmlns:atom="http://www.w3.org/2005/Atom">
  <channel>
    <!-- Channel-level metadata describing the feed itself. -->
    <title>Transformer on wiredwisdom</title>
    <link>https://wiredwisdom.netlify.app/tags/transformer/</link>
    <description>Recent content in Transformer on wiredwisdom</description>
    <generator>Hugo -- gohugo.io</generator>
    <language>en</language>
    <copyright>© 2026</copyright>
    <lastBuildDate>Tue, 31 Mar 2026 08:00:00 +0000</lastBuildDate>
    <!-- Self-referencing Atom link pointing at this feed's own URL. -->
    <atom:link href="https://wiredwisdom.netlify.app/tags/transformer/index.xml"
               rel="self"
               type="application/rss+xml"/>

    <!-- Entries, newest first by pubDate. Each item carries an empty description. -->
    <item>
      <title>Pruning for Large Language Models — From SparseGPT to KV-Cache Pruning</title>
      <link>https://wiredwisdom.netlify.app/posts/pruning-for-llms/</link>
      <pubDate>Tue, 31 Mar 2026 08:00:00 +0000</pubDate>
      <guid>https://wiredwisdom.netlify.app/posts/pruning-for-llms/</guid>
      <description/>
    </item>
    <item>
      <title>Attention Mechanism</title>
      <link>https://wiredwisdom.netlify.app/posts/attention-mechanism/</link>
      <pubDate>Sun, 23 Jun 2024 00:00:00 +0000</pubDate>
      <guid>https://wiredwisdom.netlify.app/posts/attention-mechanism/</guid>
      <description/>
    </item>
    <item>
      <title>RNN - LSTM - LLM Summary</title>
      <link>https://wiredwisdom.netlify.app/posts/rnn-lstm-llm/</link>
      <pubDate>Fri, 21 Jun 2024 00:00:00 +0000</pubDate>
      <guid>https://wiredwisdom.netlify.app/posts/rnn-lstm-llm/</guid>
      <description/>
    </item>
  </channel>
</rss>