[{"data":1,"prerenderedAt":-1},["ShallowReactive",2],{"similar-ashishpatel26--Treasure-of-Transformers":3,"tool-ashishpatel26--Treasure-of-Transformers":64},[4,17,27,35,43,56],{"id":5,"name":6,"github_repo":7,"description_zh":8,"stars":9,"difficulty_score":10,"last_commit_at":11,"category_tags":12,"status":16},3808,"stable-diffusion-webui","AUTOMATIC1111\u002Fstable-diffusion-webui","stable-diffusion-webui 是一个基于 Gradio 构建的网页版操作界面，旨在让用户能够轻松地在本地运行和使用强大的 Stable Diffusion 图像生成模型。它解决了原始模型依赖命令行、操作门槛高且功能分散的痛点，将复杂的 AI 绘图流程整合进一个直观易用的图形化平台。\n\n无论是希望快速上手的普通创作者、需要精细控制画面细节的设计师，还是想要深入探索模型潜力的开发者与研究人员，都能从中获益。其核心亮点在于极高的功能丰富度：不仅支持文生图、图生图、局部重绘（Inpainting）和外绘（Outpainting）等基础模式，还独创了注意力机制调整、提示词矩阵、负向提示词以及“高清修复”等高级功能。此外，它内置了 GFPGAN 和 CodeFormer 等人脸修复工具，支持多种神经网络放大算法，并允许用户通过插件系统无限扩展能力。即使是显存有限的设备，stable-diffusion-webui 也提供了相应的优化选项，让高质量的 AI 艺术创作变得触手可及。",162132,3,"2026-04-05T11:01:52",[13,14,15],"开发框架","图像","Agent","ready",{"id":18,"name":19,"github_repo":20,"description_zh":21,"stars":22,"difficulty_score":23,"last_commit_at":24,"category_tags":25,"status":16},1381,"everything-claude-code","affaan-m\u002Feverything-claude-code","everything-claude-code 是一套专为 AI 编程助手（如 Claude Code、Codex、Cursor 等）打造的高性能优化系统。它不仅仅是一组配置文件，而是一个经过长期实战打磨的完整框架，旨在解决 AI 代理在实际开发中面临的效率低下、记忆丢失、安全隐患及缺乏持续学习能力等核心痛点。\n\n通过引入技能模块化、直觉增强、记忆持久化机制以及内置的安全扫描功能，everything-claude-code 能显著提升 AI 在复杂任务中的表现，帮助开发者构建更稳定、更智能的生产级 AI 代理。其独特的“研究优先”开发理念和针对 Token 消耗的优化策略，使得模型响应更快、成本更低，同时有效防御潜在的攻击向量。\n\n这套工具特别适合软件开发者、AI 研究人员以及希望深度定制 AI 工作流的技术团队使用。无论您是在构建大型代码库，还是需要 AI 协助进行安全审计与自动化测试，everything-claude-code 都能提供强大的底层支持。作为一个曾荣获 Anthropic 黑客大奖的开源项目，它融合了多语言支持与丰富的实战钩子（hooks），让 AI 真正成长为懂上",138956,2,"2026-04-05T11:33:21",[13,15,26],"语言模型",{"id":28,"name":29,"github_repo":30,"description_zh":31,"stars":32,"difficulty_score":23,"last_commit_at":33,"category_tags":34,"status":16},2271,"ComfyUI","Comfy-Org\u002FComfyUI","ComfyUI 是一款功能强大且高度模块化的视觉 AI 引擎，专为设计和执行复杂的 Stable Diffusion 图像生成流程而打造。它摒弃了传统的代码编写模式，采用直观的节点式流程图界面，让用户通过连接不同的功能模块即可构建个性化的生成管线。\n\n这一设计巧妙解决了高级 AI 
绘图工作流配置复杂、灵活性不足的痛点。用户无需具备编程背景，也能自由组合模型、调整参数并实时预览效果，轻松实现从基础文生图到多步骤高清修复等各类复杂任务。ComfyUI 拥有极佳的兼容性，不仅支持 Windows、macOS 和 Linux 全平台，还广泛适配 NVIDIA、AMD、Intel 及苹果 Silicon 等多种硬件架构，并率先支持 SDXL、Flux、SD3 等前沿模型。\n\n无论是希望深入探索算法潜力的研究人员和开发者，还是追求极致创作自由度的设计师与资深 AI 绘画爱好者，ComfyUI 都能提供强大的支持。其独特的模块化架构允许社区不断扩展新功能，使其成为当前最灵活、生态最丰富的开源扩散模型工具之一，帮助用户将创意高效转化为现实。",107662,"2026-04-03T11:11:01",[13,14,15],{"id":36,"name":37,"github_repo":38,"description_zh":39,"stars":40,"difficulty_score":23,"last_commit_at":41,"category_tags":42,"status":16},3704,"NextChat","ChatGPTNextWeb\u002FNextChat","NextChat 是一款轻量且极速的 AI 助手，旨在为用户提供流畅、跨平台的大模型交互体验。它完美解决了用户在多设备间切换时难以保持对话连续性，以及面对众多 AI 模型不知如何统一管理的痛点。无论是日常办公、学习辅助还是创意激发，NextChat 都能让用户随时随地通过网页、iOS、Android、Windows、MacOS 或 Linux 端无缝接入智能服务。\n\n这款工具非常适合普通用户、学生、职场人士以及需要私有化部署的企业团队使用。对于开发者而言，它也提供了便捷的自托管方案，支持一键部署到 Vercel 或 Zeabur 等平台。\n\nNextChat 的核心亮点在于其广泛的模型兼容性，原生支持 Claude、DeepSeek、GPT-4 及 Gemini Pro 等主流大模型，让用户在一个界面即可自由切换不同 AI 能力。此外，它还率先支持 MCP（Model Context Protocol）协议，增强了上下文处理能力。针对企业用户，NextChat 提供专业版解决方案，具备品牌定制、细粒度权限控制、内部知识库整合及安全审计等功能，满足公司对数据隐私和个性化管理的高标准要求。",87618,"2026-04-05T07:20:52",[13,26],{"id":44,"name":45,"github_repo":46,"description_zh":47,"stars":48,"difficulty_score":23,"last_commit_at":49,"category_tags":50,"status":16},2268,"ML-For-Beginners","microsoft\u002FML-For-Beginners","ML-For-Beginners 是由微软推出的一套系统化机器学习入门课程，旨在帮助零基础用户轻松掌握经典机器学习知识。这套课程将学习路径规划为 12 周，包含 26 节精炼课程和 52 道配套测验，内容涵盖从基础概念到实际应用的完整流程，有效解决了初学者面对庞大知识体系时无从下手、缺乏结构化指导的痛点。\n\n无论是希望转型的开发者、需要补充算法背景的研究人员，还是对人工智能充满好奇的普通爱好者，都能从中受益。课程不仅提供了清晰的理论讲解，还强调动手实践，让用户在循序渐进中建立扎实的技能基础。其独特的亮点在于强大的多语言支持，通过自动化机制提供了包括简体中文在内的 50 多种语言版本，极大地降低了全球不同背景用户的学习门槛。此外，项目采用开源协作模式，社区活跃且内容持续更新，确保学习者能获取前沿且准确的技术资讯。如果你正寻找一条清晰、友好且专业的机器学习入门之路，ML-For-Beginners 将是理想的起点。",84991,"2026-04-05T10:45:23",[14,51,52,53,15,54,26,13,55],"数据工具","视频","插件","其他","音频",{"id":57,"name":58,"github_repo":59,"description_zh":60,"stars":61,"difficulty_score":10,"last_commit_at":62,"category_tags":63,"status":16},3128,"ragflow","infiniflow\u002Fragflow","RAGFlow 
是一款领先的开源检索增强生成（RAG）引擎，旨在为大语言模型构建更精准、可靠的上下文层。它巧妙地将前沿的 RAG 技术与智能体（Agent）能力相结合，不仅支持从各类文档中高效提取知识，还能让模型基于这些知识进行逻辑推理和任务执行。\n\n在大模型应用中，幻觉问题和知识滞后是常见痛点。RAGFlow 通过深度解析复杂文档结构（如表格、图表及混合排版），显著提升了信息检索的准确度，从而有效减少模型“胡编乱造”的现象，确保回答既有据可依又具备时效性。其内置的智能体机制更进一步，使系统不仅能回答问题，还能自主规划步骤解决复杂问题。\n\n这款工具特别适合开发者、企业技术团队以及 AI 研究人员使用。无论是希望快速搭建私有知识库问答系统，还是致力于探索大模型在垂直领域落地的创新者，都能从中受益。RAGFlow 提供了可视化的工作流编排界面和灵活的 API 接口，既降低了非算法背景用户的上手门槛，也满足了专业开发者对系统深度定制的需求。作为基于 Apache 2.0 协议开源的项目，它正成为连接通用大模型与行业专有知识之间的重要桥梁。",77062,"2026-04-04T04:44:48",[15,14,13,26,54],{"id":65,"github_repo":66,"name":67,"description_en":68,"description_zh":69,"ai_summary_zh":69,"readme_en":70,"readme_zh":71,"quickstart_zh":72,"use_case_zh":73,"hero_image_url":74,"owner_login":75,"owner_name":76,"owner_avatar_url":77,"owner_bio":78,"owner_company":79,"owner_location":80,"owner_email":81,"owner_twitter":82,"owner_website":83,"owner_url":84,"languages":85,"stars":90,"forks":91,"last_commit_at":92,"license":93,"difficulty_score":94,"env_os":95,"env_gpu":95,"env_ram":95,"env_deps":96,"category_tags":103,"github_topics":104,"view_count":123,"oss_zip_url":82,"oss_zip_packed_at":82,"status":16,"created_at":124,"updated_at":125,"faqs":126,"releases":132},671,"ashishpatel26\u002FTreasure-of-Transformers","Treasure-of-Transformers","💁 Awesome Treasure of Transformers Models for Natural Language processing contains papers, videos, blogs, official repo along with colab Notebooks. 
🛫☑️","Treasure-of-Transformers 是一个专注于自然语言处理（NLP）领域的开源资源合集，堪称 Transformer 模型的学习宝库。它系统性地整理了从原始 Transformer 到 GPT、BERT 等主流深度学习算法的全套资料。针对 NLP 研究资料分散、代码复现门槛高的问题，Treasure-of-Transformers 将论文、视频教程、技术博客、官方仓库及可运行的 Colab Notebook 聚合在一起，极大提升了获取效率。\n\n无论是渴望深入理解模型原理的研究人员，还是需要快速落地项目的算法工程师，亦或是正在入门的学生，都能在此找到匹配的资源。其独特之处在于不仅提供理论支持，更强调实践操作，每个模型条目都附带了可直接在云端执行的代码示例。这种理论与实践并重的模式，帮助用户轻松跨越从概念到实现的鸿沟，是 NLP 技术栈构建中一份极具价值的参考指南。","# Awesome Treasure of Transformers Models Collection\n\n![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8dc10b5ba7f5.jpg)\n\n![fw.jpg](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_f81f9ff72b3e.jpg)\n\n---\n\n###  🧑‍💻👩‍💻Collection of All NLP Deep learning algorithm list with Code 🧑‍💻👩‍💻![Jupyter Notebook](https:\u002F\u002Fimg.shields.io\u002Fbadge\u002Fjupyter-%23FA0F00.svg?style=for-the-badge&logo=jupyter&logoColor=white)\n\n---\n\n| Sr No | Algorithm Name                                               | Year | Blog                                                         | Video                                                        | Official Repo                                                | Code                                                         |\n| ----- | ------------------------------------------------------------ | ---- | ------------------------------------------------------------ | ------------------------------------------------------------ | ------------------------------------------------------------ | ------------------------------------------------------------ |\n| 1     | [GPT-Neo](https:\u002F\u002Fgithub.com\u002FEleutherAI\u002Fgpt-neo)             | 2021 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3rYanJk) | 
[![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002F6MI0f6YjJIk) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002FEleutherAI\u002Fgpt-neo) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fgithub\u002FEleutherAI\u002FGPTNeo\u002Fblob\u002Fmaster\u002FGPTNeo_example_notebook.ipynb) |\n| 2     | [Transformer](https:\u002F\u002Farxiv.org\u002Fabs\u002F1706.03762v5)            | 2017 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3DNsrIp) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002FiDulhoQ2pro) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Ftensorflow\u002Fmodels\u002Ftree\u002Fmaster\u002Fofficial\u002Fnlp\u002Ftransformer) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fgithub\u002Fbentrevett\u002Fpytorch-seq2seq\u002Fblob\u002Fmaster\u002F6%20-%20Attention%20is%20All%20You%20Need.ipynb) |\n| 3     | [BERT](https:\u002F\u002Farxiv.org\u002Fabs\u002F1810.04805v2)                   | 2018 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3pPV8PS) | 
[![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002F7kLi8u2dJz0) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fgoogle-research\u002Fbert) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fgithub\u002FNielsRogge\u002FTransformers-Tutorials\u002Fblob\u002Fmaster\u002FBERT\u002FCustom_Named_Entity_Recognition_with_BERT_only_first_wordpiece.ipynb) |\n| 4     | [GPT](https:\u002F\u002Fs3-us-west-2.amazonaws.com\u002Fopenai-assets\u002Fresearch-covers\u002Flanguage-unsupervised\u002Flanguage_understanding_paper.pdf) | 2018 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3ENPuEn) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002F9ebPNEHRwXU) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fhuggingface\u002Ftransformers) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fgithub\u002Fkeras-team\u002Fkeras-io\u002Fblob\u002Fmaster\u002Fexamples\u002Fgenerative\u002Fipynb\u002Ftext_generation_with_miniature_gpt.ipynb) |\n| 5     | [Universal Transformer](https:\u002F\u002Farxiv.org\u002Fabs\u002F1807.03819v3)  | 2018 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3lRi6VG) | 
[![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)]() | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Ftensorflow\u002Ftensor2tensor) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fgithub\u002Ftensorflow\u002Ftensor2tensor\u002Fblob\u002Fmaster\u002Ftensor2tensor\u002Fnotebooks\u002Fhello_t2t.ipynb) |\n| 6     | [T-D](https:\u002F\u002Farxiv.org\u002Fabs\u002F1801.10198v1)                    | 2018 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3F17Ba5) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002F__ALQCud-iA) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Ftensorflow\u002Ftensor2tensor) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fgithub\u002Ftensorflow\u002Ftensor2tensor\u002Fblob\u002Fmaster\u002Ftensor2tensor\u002Fnotebooks\u002Fhello_t2t.ipynb) |\n| 7     | [GPT-2](https:\u002F\u002Fd4mucfpksywv.cloudfront.net\u002Fbetter-language-models\u002Flanguage-models.pdf) | 2019 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3rXapBi) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002FX-B3nAN7YRM) | 
[![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fopenai\u002Fgpt-2) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fgithub\u002Fhuggingface\u002Fblog\u002Fblob\u002Fmaster\u002Fnotebooks\u002F02_how_to_generate.ipynb) |\n| 8     | [T5](https:\u002F\u002Farxiv.org\u002Fabs\u002F1910.10683v3)                     | 2019 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3yjbrZf) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002FjgKj-7v2UYU) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fgoogle-research\u002Ftext-to-text-transfer-transformer) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fgithub\u002FNielsRogge\u002FTransformers-Tutorials\u002Fblob\u002Fmaster\u002FT5\u002FFine_tune_CodeT5_for_generating_docstrings_from_Ruby_code.ipynb) |\n| 9     | [BART](https:\u002F\u002Farxiv.org\u002Fabs\u002F1910.13461v1)                   | 2019 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3yead1D) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002FXz4fiQNmGSA) | 
[![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Ffacebookresearch\u002FGENRE) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fgithub\u002Fmrm8488\u002Fshared_colab_notebooks\u002Fblob\u002Fmaster\u002FBART_with_JS_UI.ipynb) |\n| 10    | [XLNet](https:\u002F\u002Farxiv.org\u002Fabs\u002F1906.08237v2)                  | 2019 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3EGEHM5) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002F8J8KkuncAmY) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fzihangdai\u002Fxlnet) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fdrive\u002F1YXojI6USFGV3498Pygllv0z8vTMVIiEt) |\n| 11    | [ALBERT](https:\u002F\u002Farxiv.org\u002Fabs\u002F1909.11942v6)                 | 2019 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3lW9L34) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002FLwtj2yUAMgI) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fgoogle-research\u002FALBERT) | [![Open In 
Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fgithub\u002Fgoogle-research\u002Falbert\u002Fblob\u002Fmaster\u002Falbert_glue_fine_tuning_tutorial.ipynb) |\n| 12    | [Distil-BERT](https:\u002F\u002Farxiv.org\u002Fabs\u002F1910.01108v4)            | 2019 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3GPQKHN) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002FcCs8exFrGE8) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)]() | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)]() |\n| 13    | [Transformer-XL](https:\u002F\u002Farxiv.org\u002Fabs\u002F1901.02860v3)         | 2019 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3lW6qkC) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002FmqsRZAJav70) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fkimiyoung\u002Ftransformer-xl) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fgithub\u002Flab-ml\u002Fnn\u002Fblob\u002Fmaster\u002Flabml_nn\u002Ftransformers\u002Fxl\u002Fexperiment.ipynb) |\n| 14    | [XLM](https:\u002F\u002Farxiv.org\u002Fabs\u002F1901.07291v1)                    | 2019 | 
[![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F31M5BDH) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002FcaZLVcJqsqo) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Ffacebookresearch\u002FXLM) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fgithub\u002FTikquuss\u002Fmeta_XLM\u002Fblob\u002Fmaster\u002Fnotebooks\u002Fdemo\u002Ftuto.ipynb) |\n| 15    | [ViLBERT](https:\u002F\u002Farxiv.org\u002Fabs\u002F1908.02265v1)                | 2019 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F31M5KqJ) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002Fdd7nE4nbxN0) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Ffacebookresearch\u002Fvilbert-multi-task\u002F) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fgithub\u002Ffacebookresearch\u002Fvilbert-multi-task\u002Fblob\u002F9d645085b54fac6a781257133edabefdfb23e547\u002Fdemo.ipynb) |\n| 16    | [Sparse Transformer](https:\u002F\u002Farxiv.org\u002Fabs\u002F1904.10509v1)     | 2019 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3ELosND) | 
[![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002FjaqjcHmCBfY) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fopenai\u002Fsparse_attention) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fgithub.com\u002Fptillet\u002Ftorch-blocksparse\u002Fblob\u002Fmaster\u002Fexamples\u002Fsimple.py) |\n| 17    | [Levenshtein Transformer](https:\u002F\u002Farxiv.org\u002Fabs\u002F1905.11006v2) | 2019 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3rUU4wQ) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002FFtUbMG3rlFs) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fpytorch\u002Ffairseq) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)]() |\n| 18    | [CTRL](https:\u002F\u002Farxiv.org\u002Fabs\u002F1909.05858v2)                   | 2019 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F33pJRhX) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002Fq5zw2Wh4Rdo) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fsalesforce\u002Fctrl) | [![Open In 
Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fdrive\u002F1nDh3ayRPJGK5ciPO2D3TFkYZFqclBWHY) |\n| 19    | [VideoBERT](https:\u002F\u002Farxiv.org\u002Fabs\u002F1904.01766v2)              | 2019 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F31PHkN2) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002FEkuyLsJX4QM) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002FMDSKUL\u002FMasterProject) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fgithub.com\u002Fammesatyajit\u002FVideoBERT) |\n| 20    | [Compressive Transformer](https:\u002F\u002Farxiv.org\u002Fabs\u002F1911.05507v1) | 2019 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3rX1q2L) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002F0TMKCQiT1T0) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fdeepmind\u002Fpg19) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fgithub.com\u002Flucidrains\u002Fcompressive-transformer-pytorch) |\n| 21    | [CuBERT](https:\u002F\u002Farxiv.org\u002Fabs\u002F2001.00059v3)                 | 2019 | 
[![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3lXcxVH) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002FbCPeg0Tp64s) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fgoogle-research\u002Fgoogle-research\u002Ftree\u002Fmaster\u002Fcubert) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fgithub\u002Fai-center-kth\u002FcuBERT-source-code-clustering\u002Fblob\u002Fmain\u002Fsrc\u002Fevaluation.ipynb) |\n| 22    | [BP-Transformer](https:\u002F\u002Farxiv.org\u002Fabs\u002F1911.04070v1)         | 2019 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3yuzqFj) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)]() | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fyzh119\u002FBPT) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)]() |\n| 23    | [Adaptively Sparse Transformer](https:\u002F\u002Farxiv.org\u002Fabs\u002F1909.00015v2) | 2019 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3lXLbyG) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002F_pYxa50HTBw) | 
[![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fdeep-spin\u002Fentmax) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fgithub\u002Fprajjwal1\u002Fadaptive_transformer\u002Fblob\u002F8f062a7d5c6573ebdb1aa2b57113db918156b15a\u002Fnbs\u002Fadaptive_train.ipynb) |\n| 24    | [Sandwich Transformer](https:\u002F\u002Farxiv.org\u002Fabs\u002F1911.03864v2)   | 2019 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F31V686t) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002FEM8xFAjtZUQ) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fofirpress\u002Fsandwich_transformer) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fgithub.com\u002Flucidrains\u002Fx-transformers) |\n| 25    | [FSMT](https:\u002F\u002Farxiv.org\u002Fabs\u002F1907.06616)                     | 2019 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3oIFarp) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)]() | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fpytorch\u002Ffairseq\u002Ftree\u002Fmain\u002Fexamples\u002Fwmt19) | [![Open In 
Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fhuggingface.co\u002Ftransformers\u002Fv3.5.1\u002Fmodel_doc\u002Ffsmt.html) |\n| 26    | [LXMERT](https:\u002F\u002Farxiv.org\u002Fabs\u002F1908.07490)                   | 2019 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3oJq19i) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)]() | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fairsplay\u002Flxmert) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fdrive\u002F18TyuMfZYlgQ_nXo-tr8LCnzUaoX0KS-h?usp=sharing) |\n| 27    | [VisualBERT](https:\u002F\u002Farxiv.org\u002Fpdf\u002F1908.03557)               | 2019 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3s0AgIq) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002FLhi1UFsXvpk) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fuclanlp\u002Fvisualbert) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fgithub\u002Fuclanlp\u002Fvisualbert\u002Fblob\u002Fe49b61906dff12f1b2992226ae84c538fcf438e4\u002Funsupervised_visualbert\u002Fdata\u002Fnlvr2\u002Fnlvr\u002Fnlvr2\u002FNLVR2BiasAnalysis.ipynb) |\n| 28    | 
[GPT-3](https:\u002F\u002Farxiv.org\u002Fabs\u002F2005.14165v4)                  | 2020 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3oIFwhJ) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002FSboKeK6FFHQ) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fopenai\u002Fgpt-3) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fgithub\u002Frafajak\u002Fgpt3_examples\u002Fblob\u002Fmaster\u002FGPT3_search_example.ipynb) |\n| 29    | [ELECTRA](https:\u002F\u002Farxiv.org\u002Fabs\u002F2003.10555v1)                | 2020 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3lUZGDy) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002Fp9c7SoD4AMc) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fgoogle-research\u002Felectra) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fdrive\u002F1DiOwhRjQbtYRgFWG7e3dybcXJsZcu86l) |\n| 30    | [Electric](https:\u002F\u002Farxiv.org\u002Fabs\u002F2012.08561v1)               | 2020 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F31SfM9E) | 
[![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)]() | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fgoogle-research\u002Felectra) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)]() |\n| 31    | [LongFormer](https:\u002F\u002Farxiv.org\u002Fabs\u002F2004.05150v2)             | 2020 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3oJ03mh) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002F_8KNb5iqblE) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fallenai\u002Flongformer) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fgithub\u002Fpatil-suraj\u002FNotebooks\u002Fblob\u002Fmaster\u002Flongformer_qa_training.ipynb) |\n| 32    | [mBART](https:\u002F\u002Farxiv.org\u002Fabs\u002F2001.08210v2)                  | 2020 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3EPC0Ii) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002FoO7k5lH8Oe8) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fpytorch\u002Ffairseq\u002Ftree\u002Fmaster\u002Fexamples\u002Fmbart) | [![Open In 
Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fgithub\u002Fsdhilip200\u002FMachine-Translation-using-mBART-50-and-Hugging-Face\u002Fblob\u002Fmain\u002FMachine_Translation.ipynb) |\n| 33    | [Performer](https:\u002F\u002Farxiv.org\u002Fabs\u002F2009.14794v3)              | 2020 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3pLxvYW) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002FxJrKIPwVwGM) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fgoogle-research\u002Fgoogle-research) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fdrive\u002F1ICW0DpXfUuVYsnNkt1DHwUyyTduHHvE3?usp=sharing) |\n| 34    | [ETC](https:\u002F\u002Farxiv.org\u002Fabs\u002F2004.08483v5)                    | 2020 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3rWIy3W) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002FTyydOhj28A4) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fgoogle-research\u002Fgoogle-research\u002Ftree\u002Fmaster\u002Fetcmodel) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)]() |\n| 35    | [CodeBERT](https:\u002F\u002Farxiv.org\u002Fabs\u002F2002.08155v4)               | 2020 | 
[![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3pPuIhc) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002FYmAXluUDPPI) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fmicrosoft\u002FCodeBERT) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fgithub\u002Fgraykode\u002Fcommit-autosuggestions\u002Fblob\u002F579d7a34f3ebb735d2a9f13afc74eeb66c0d7427\u002Fcommit_autosuggestions.ipynb) |\n| 36    | [mT5](https:\u002F\u002Farxiv.org\u002Fabs\u002F2010.11934v3)                    | 2020 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3DJ76jh) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)]() | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)]() | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fgithub\u002Fejmejm\u002Fmultilingual-nmt-mt5\u002Fblob\u002Fmain\u002Fnmt_full_version.ipynb) |\n| 37    | [Reformer](https:\u002F\u002Farxiv.org\u002Fabs\u002F2001.04451v2)               | 2020 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3pPSTMn) | 
[![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002Fi4H0kjxrias) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fgoogle\u002Ftrax\u002Ftree\u002Fmaster\u002Ftrax\u002Fmodels\u002Freformer) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fgithub\u002Fpatrickvonplaten\u002Fnotebooks\u002Fblob\u002Fmaster\u002FPyTorch_Reformer.ipynb) |\n| 38    | [DeBERTa & DeBERTa-v2](https:\u002F\u002Farxiv.org\u002Fabs\u002F2006.03654v6)   | 2020 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3GyaT4F) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002F_c6A33Fg5Ns) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fmicrosoft\u002FDeBERTa) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fgithub\u002Fmusthofasyarifudin\u002FDeberta-Language-Modeling-For-NLP\u002Fblob\u002Fmain\u002FMLM_Deberta_Base.ipynb) |\n| 39    | [Linformer](https:\u002F\u002Farxiv.org\u002Fabs\u002F2006.04768v3)              | 2020 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3DMx5GH) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002F-_2AF9Lhweo) | 
[![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fkuixu\u002FLinear-Multihead-Attention) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fdrive\u002F1zHenqau3rMo3oS_7EisfGsahSs-1_sok?usp=sharing) |\n| 40    | [RAG](https:\u002F\u002Farxiv.org\u002Fabs\u002F2005.11401v4)                    | 2020 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F30f4ig2) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002FdzChvuZI6D4) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fhuggingface.co\u002Fdocs\u002Ftransformers\u002Fmodel_doc\u002Frag?utm_source=catalyzex.com) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fgithub\u002Fipavlopoulos\u002Fmodern_nlp\u002Fblob\u002Ff2a7af7e9de68d505dd1585c04cc51f30433122b\u002FModern_NLP_S5.ipynb) |\n| 41    | [ProphetNet](https:\u002F\u002Farxiv.org\u002Fabs\u002F2001.04063v3)             | 2020 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F31RisVr) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002F9Hoo_qdjSio) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fmicrosoft\u002FProphetNet) | [![Open In 
Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fdrive\u002F11uPpxZzoTofnHZsyDPaJr5dFKsgOmTD9#scrollTo=j5CRrgNFc_Jq) |\n| 42    | [BigBird](https:\u002F\u002Farxiv.org\u002Fabs\u002F2007.14062v2)                | 2020 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3pPTSMz) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002FWVPE62Gk3EM) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fgoogle-research\u002Fbigbird) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fgithub\u002Fvasudevgupta7\u002Fbigbird\u002Fblob\u002Fmain\u002Fnotebooks\u002Fevaluate_nq.ipynb) |\n| 43    | [PLATO-2](https:\u002F\u002Farxiv.org\u002Fabs\u002F2006.16779v4)                | 2020 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3DF7hMA) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002F0zlRRC0jPf4) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002FPaddlePaddle\u002FKnover) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fgithub.com\u002FPaddlePaddle\u002FPaddleNLP\u002Ftree\u002Fdevelop\u002Fexamples\u002Fdialogue\u002Fplato-2) |\n| 44    | [Routing 
Transformer](https:\u002F\u002Farxiv.org\u002Fabs\u002F2003.05997v5)    | 2020 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3IGcabW) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)]() | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Flucidrains\u002Frouting-transformer) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fdrive\u002F1sw1Hjx3EllhKZh4nhJ3TIZ978HjKVUFQ?usp=sharing) |\n| 45    | [DeeBERT](https:\u002F\u002Farxiv.org\u002Fabs\u002F2004.12993v1)                | 2020 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3GB1Ks8) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)]() | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fcastorini\u002FDeeBERT) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fgithub\u002Fcastorini\u002FDeeBERT\u002Fblob\u002F3efc01db07a0bed88e19551992b8378994195d1c\u002Fnotebooks\u002FComparing-TF-and-PT-models-SQuAD.ipynb) |\n| 46    | [DynaBERT](https:\u002F\u002Farxiv.org\u002Fabs\u002F2004.04037v2)               | 2020 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3EGKyRz) | 
[![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002FUuGYwjCOGQo) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fhuawei-noah\u002FPretrained-Language-Model\u002Ftree\u002Fmaster\u002FDynaBERT) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fgithub.com\u002Fhuawei-noah\u002FPretrained-Language-Model\u002Ftree\u002Fmaster\u002FDynaBERT) |\n| 47    | [TernaryBERT](https:\u002F\u002Farxiv.org\u002Fabs\u002F2009.12812v3)            | 2020 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3dECdlu) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fpapertalk.org\u002Fpapertalks\u002F11743) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fhuawei-noah\u002FPretrained-Language-Model\u002Ftree\u002Fmaster\u002FTernaryBERT) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fgithub.com\u002Fhuawei-noah\u002FPretrained-Language-Model\u002Ftree\u002Fmaster\u002FTernaryBERT) |\n| 48    | [MobileBERT](https:\u002F\u002Farxiv.org\u002Fabs\u002F2004.02984v2)             | 2020 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3yirFlJ) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)]() | 
[![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fgoogle-research\u002Fgoogle-research) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fgithub\u002Fsayakpaul\u002FBERT-for-Mobile\u002Fblob\u002Fmaster\u002FMobileBERT_Keras.ipynb) |\n| 49    | [Bort](https:\u002F\u002Farxiv.org\u002Fabs\u002F2010.10499v2)                   | 2020 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3oMixme) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)]() | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Falexa\u002Fbort) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)]() |\n| 50    | [DeLighT](https:\u002F\u002Farxiv.org\u002Fabs\u002F2008.00623v2)                | 2020 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3DRXQtq) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002F-AVqR2qZHb4) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fsacmehta\u002Fdelight) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)]() |\n| 51    | [PAR Transformer](https:\u002F\u002Farxiv.org\u002Fabs\u002F2009.04534v3)        | 2020 | 
[![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3s26Nhk) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)]() | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002FJmkernes\u002FPAR-Transformer-XL) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fgithub.com\u002FJmkernes\u002FPAR-Transformer-XL\u002Fblob\u002Fee2c2bd5cd672eddbe06d68614298de8283c5b2f\u002Fcolab.ipynb) |\n| 52    | [ConvBERT](https:\u002F\u002Farxiv.org\u002Fabs\u002F2008.02496v3)               | 2020 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3pKkqPi) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fbit.ly\u002F321uKKx) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fyitu-opensource\u002FConvBert) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fdrive\u002F1WIu2Cc1C8E7ayZBzEmpfd5sXOhe7Ehhz?usp=sharing) |\n| 53    | [IB-BERT](https:\u002F\u002Farxiv.org\u002Fabs\u002F2004.02984v2)                | 2020 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3dKRvVT) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)]() | 
[![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fgoogle-research\u002Fgoogle-research) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fgithub\u002Flordtt13\u002Ftransformers-experiments\u002Fblob\u002F5ea4537ee0662fb6ca2ba736a50f4894197eec60\u002FCustom%20Tasks\u002Femo-mobilebert.ipynb) |\n| 54    | [MacBERT](https:\u002F\u002Farxiv.org\u002Fabs\u002F2004.13922v2)                | 2020 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3GTTdkv) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)]() | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fymcui\u002FMacBERT) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fgithub\u002Fshibing624\u002Fnlp-tutorial\u002Fblob\u002Fc9c00b2160397248381203658194a63044e7d7d5\u002F03_language_model\u002F03_Bert%E5%AE%8C%E5%BD%A2%E5%A1%AB%E7%A9%BA.ipynb) |\n| 55    | [RealFormer](https:\u002F\u002Farxiv.org\u002Fabs\u002F2012.11747v3)             | 2020 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3EQSoYW) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fbit.ly\u002F3DMWyzG) | 
[![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fgoogle-research\u002Fgoogle-research) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fgithub.com\u002Fjaketae\u002Frealformer) |\n| 56    | [Sinkhorn Transformer](https:\u002F\u002Farxiv.org\u002Fabs\u002F2002.11296v1)   | 2020 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3yjJOiV) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)]() | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Flucidrains\u002Fsinkhorn-transformer) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fdrive\u002F1Eej8U4pP5ldZOz3tHwpoBFgmQqLhQLUq) |\n| 57    | [SongNet](https:\u002F\u002Farxiv.org\u002Fabs\u002F2004.08022v2)                | 2020 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3ym2hLH) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)]() | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Flipiji\u002FSongNet) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)]() |\n| 58    | [Funnel Transformer](https:\u002F\u002Farxiv.org\u002Fabs\u002F2006.03236v1)     | 2020 | 
[![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F31WfMWc) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002FQsIcEqGriGg) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Flaiguokun\u002FFunnel-Transformer) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fgithub\u002FiIsunnyIi\u002FFunnel-Transformer\u002Fblob\u002Fmain\u002FFunnel_IntentRecognition.ipynb) |\n| 59    | [SC-GPT](https:\u002F\u002Farxiv.org\u002Fabs\u002F2002.12328v1)                 | 2020 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F31VCldV) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002FNWHqFbgHqng) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fpengbaolin\u002FSC-GPT) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)]() |\n| 60    | [SMITH](https:\u002F\u002Farxiv.org\u002Fabs\u002F2004.12297v2)                  | 2020 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3dHyOm2) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002FVHsYJu9VzyI) | 
[![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fgoogle-research\u002Fgoogle-research\u002Ftree\u002Fmaster\u002Fsmith) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)]() |\n| 61    | [BinaryBERT](https:\u002F\u002Farxiv.org\u002Fabs\u002F2012.15701v2)             | 2020 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3dNguYx) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)]() | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fhuawei-noah\u002FPretrained-Language-Model\u002Ftree\u002Fmaster\u002FBinaryBERT) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)]() |\n| 62    | [SqueezeBERT](https:\u002F\u002Farxiv.org\u002Fabs\u002F2006.11316v1)            | 2020 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3EPfqiT) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002FkPMaEYSywdI) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fhuggingface\u002Ftransformers\u002Fblob\u002Fmaster\u002Fsrc\u002Ftransformers\u002Fmodeling_squeezebert.py) | [![Open In 
Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fgithub\u002Furainshah\u002FUse-of-transformers-hugging-face\u002Fblob\u002Fmain\u002Ffakenews_squeezebert1.ipynb) |\n| 63    | [Feedback Transformer](https:\u002F\u002Farxiv.org\u002Fabs\u002F2002.09402v3)   | 2020 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F31VDQJ5) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002F-QH8fRhqFHM) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Ffacebookresearch\u002Ftransformer-sequential) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fgithub\u002Frajaswa\u002Ffeedback-and-memory-in-transformers\u002Fblob\u002Fmain\u002FFeedback_and_Memory_in_Transformers.ipynb) |\n| 64    | [CamemBERT](https:\u002F\u002Farxiv.org\u002Fabs\u002F1911.03894)                | 2020 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3yj1AD0) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)]() | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fhuggingface.co\u002Fdocs\u002Ftransformers\u002Fmodel_doc\u002Fcamembert) | [![Open In 
Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fgithub\u002FSimonLembeye\u002Ffrench-sentence-embedding\u002Fblob\u002Fmaster\u002Fsentence_transformers_camembert.ipynb) |\n| 65    | [CPM](https:\u002F\u002Farxiv.org\u002Fabs\u002F2012.00413)                      | 2020 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F30jaW4W) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002FdFTG3ohAcso) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002FTsinghuaAI\u002FCPM-1-Generate) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)]() |\n| 66    | [DialoGPT](https:\u002F\u002Farxiv.org\u002Fabs\u002F1911.00536)                 | 2020 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3dKCT8T) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002FZo679MYoJns) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fmicrosoft\u002FDialoGPT) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fdrive\u002F1PslHE4Rl4RqSa20s7HEp0ZKITBir6ezE) |\n| 67    | [DPR](https:\u002F\u002Farxiv.org\u002Fabs\u002F2004.04906)                      | 2020 | 
[![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3oLM0g0) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002FDBsxUSUhfRg) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Ffacebookresearch\u002FDPR) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fgithub\u002Fdeepset-ai\u002Fhaystack\u002Fblob\u002Fmaster\u002Ftutorials\u002FTutorial1_Basic_QA_Pipeline.ipynb) |\n| 68    | [FlauBERT](https:\u002F\u002Farxiv.org\u002Fabs\u002F1912.05372)                 | 2020 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3GENX40) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fbit.ly\u002F3GElYkU) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fgetalp\u002FFlaubert) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fgithub\u002FRushikesh10\u002FFlauBERT-Text-Summarization\u002Fblob\u002Fmain\u002FFlauBERT%20Colab%20Notebook.ipynb) |\n| 69    | [HerBERT](https:\u002F\u002Fwww.aclweb.org\u002Fanthology\u002F2020.acl-main.111.pdf) | 2020 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3GyppJM) | 
[![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fbit.ly\u002F3dOIR92) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fallegro\u002Fklejbenchmark-baselines) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fgithub\u002Fklinkeklinke\u002FTransformersTransferLearning\u002Fblob\u002F32aae9ee170a9c7fe4037a9dc7d3cee150805c38\u002Ftransfer_learning_nlp.ipynb#scrollTo=c4cf3720) |\n| 70    | [LayoutLM](https:\u002F\u002Farxiv.org\u002Fabs\u002F1912.13318)                 | 2020 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3rWIukZ) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002FzazN_yFWlLM) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fmicrosoft\u002Funilm) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fgithub\u002FNielsRogge\u002FTransformers-Tutorials\u002Fblob\u002Fmaster\u002FLayoutLM\u002FFine_tuning_LayoutLMForTokenClassification_on_FUNSD.ipynb) |\n| 71    | [LED](https:\u002F\u002Farxiv.org\u002Fabs\u002F2004.05150)                      | 2020 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3pTAGh4) | 
[![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002F_8KNb5iqblE) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fallenai\u002Flongformer) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fgithub\u002Fallenai\u002Flongformer\u002Fblob\u002Fmaster\u002Fscripts\u002Fconvert_model_to_long.ipynb) |\n| 72    | [LUKE](https:\u002F\u002Farxiv.org\u002Fabs\u002F2010.01057)                     | 2020 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3rYxxiC) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002Foho-i5Ws07g) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fstudio-ousia\u002Fluke) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fgithub\u002FNielsRogge\u002FTransformers-Tutorials\u002Fblob\u002Fmaster\u002FLUKE\u002FSupervised_relation_extraction_with_LukeForEntityPairClassification.ipynb) |\n| 73    | [M2M100](https:\u002F\u002Farxiv.org\u002Fabs\u002F2010.11125)                   | 2020 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F33jc6P3) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fbit.ly\u002F30u83yw) | 
[![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fpytorch\u002Ffairseq) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fgithub\u002Fharveenchadha\u002Fbol\u002Fblob\u002Fmain\u002Fdemos\u002Fgr\u002Fhindi\u002FSpeech_ASR_plus_Translation_Hindi.ipynb) |\n| 74    | [MBart and MBart-50](https:\u002F\u002Farxiv.org\u002Fabs\u002F2001.08210)       | 2020 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3lZelh1) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002FoO7k5lH8Oe8) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fpytorch\u002Ffairseq\u002Ftree\u002Fmaster\u002Fexamples\u002Fmbart) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fgithub\u002Fsdhilip200\u002FMachine-Translation-using-mBART-50-and-Hugging-Face\u002Fblob\u002Fmain\u002FMachine_Translation.ipynb) |\n| 75    | [MegatronBERT](https:\u002F\u002Farxiv.org\u002Fabs\u002F1909.08053)             | 2020 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3IMtdZO) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002FwBgpMf_KQVw) | 
[![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002FNVIDIA\u002FMegatron-LM) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fgithub\u002Fkssteven418\u002FQ-ASR\u002Fblob\u002F0ad68cdeddbd5a4c8edba6a0876470ec48186584\u002Ftutorials\u002Fnlp\u002FRelation_Extraction-BioMegatron.ipynb) |\n| 76    | [MegatronGPT2](https:\u002F\u002Farxiv.org\u002Fabs\u002F1909.08053)             | 2020 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F33tQMGV) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)]() | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)]() | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fgithub\u002F877152223\u002FBugInjector\u002Fblob\u002F4cf14e237b97a724edbb4b1300170c3cc832fc2f\u002FBugInjector-GPT2.ipynb) |\n| 77    | [MPNet](https:\u002F\u002Farxiv.org\u002Fabs\u002F2004.09297)                    | 2020 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3pPD6gO) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002FWS1uVMGhlWQ) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fmicrosoft\u002FMPNet) | [![Open In 
Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fgithub\u002F04mayukh\u002FNeutral-tweet-identification-on-OLID-using-Neutrosophy\u002Fblob\u002F45bbd6c57054337e8af6429554f2dda4aef266d1\u002FModels\u002FMPNet.ipynb) |\n| 78    | [Pegasus](https:\u002F\u002Farxiv.org\u002Fpdf\u002F1912.08777.pdf)              | 2020 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3mkVsWb) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002FnaRdmLvlEzE) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fgoogle-research\u002Fpegasus) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fgithub\u002FCoGian\u002Fpegasus_demo_huggingface\u002Fblob\u002Fmaster\u002Fpegasus_demo_huggingface.ipynb) |\n| 79    | [PhoBERT](https:\u002F\u002Farxiv.org\u002Fabs\u002F2003.00744v3)                | 2020 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F31Kahul) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002F7d--8leiZgA) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fpaperswithcode.com\u002Fpaper\u002Fphobert-pre-trained-language-models-for#code) | [![Open In 
Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fgithub\u002Fncthuan\u002Ftext_cls_phobert\u002Fblob\u002Fmaster\u002Fphobert_clf.ipynb) |\n| 80    | [QDQBERT](https:\u002F\u002Farxiv.org\u002Fabs\u002F2004.09602)                  | 2020 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3pXReVs) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002FmDefFU7rbV0) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fhuggingface\u002Fpytorch-transformers) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fgithub\u002FELS-RD\u002Ftransformer-deploy\u002Fblob\u002F814477ce3b3279cff8f8c3947294119f399903b6\u002Fdemo\u002Fquantization_end_to_end.ipynb) |\n| 81    | [RemBERT](https:\u002F\u002Farxiv.org\u002Fabs\u002F2010.12821)                  | 2020 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F31KaNIN) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)]() | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002FJK1002497318\u002FRemBERT) | [![Open In 
Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fgithub\u002Fkldarek\u002Fchaii\u002Fblob\u002F194f92b808cb1c81b70b889ab8d061344ef34ef9\u002Ftraining_notebooks\u002FREMBERT_pretraining77.ipynb) |\n| 82    | [RetriBERT](https:\u002F\u002Fyjernite.github.io\u002Flfqa.html)            | 2020 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3s0Ta1O) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)]() | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)]() | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fgithub\u002Frobhaslinger\u002FEALI5-redux\u002Fblob\u002F50ce17c33c333a0d9781f00e29888f2844ad6aae\u002Fnotebooks\u002Fqa_step_by_step.ipynb) |\n| 83    | [Speech2Text](https:\u002F\u002Farxiv.org\u002Fabs\u002F2010.05171)              | 2020 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F31ZJWI7) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002Fa-OwY2SqKQI) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fpytorch\u002Ffairseq\u002Ftree\u002Fmaster\u002Fexamples\u002Fspeech_to_text) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)]() |\n| 84    | [T5v1.1](https:\u002F\u002Farxiv.org\u002Fabs\u002F2002.05202)                   | 2020 | 
[![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3pSWCJm) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)]() | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fgoogle-research\u002Ftext-to-text-transfer-transformer\u002F) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fgithub.com\u002Flucidrains\u002Fx-transformers) |\n| 85    | [TAPAS](https:\u002F\u002Farxiv.org\u002Fabs\u002F2004.02349)                    | 2020 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3lZtfnE) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002FZnuEOQrT4h0) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fgoogle-research\u002Ftapas) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fgithub\u002FNielsRogge\u002FTransformers-Tutorials\u002Fblob\u002Fmaster\u002FTAPAS\u002FEvaluating_TAPAS_on_the_Tabfact_test_set.ipynb) |\n| 86    | [Wav2Vec2](https:\u002F\u002Farxiv.org\u002Fabs\u002F2006.11477)                 | 2020 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3GJBADT) | 
[![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002FaUSXvoWfy3w) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fchuachinhon\u002Fwav2vec2_transformers) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fgithub\u002Fchuachinhon\u002Fwav2vec2_transformers\u002Fblob\u002Fmain\u002Fnotebooks\u002F2.2_wav2vec2_poetry_alt.ipynb) |\n| 87    | [XLM-ProphetNet](https:\u002F\u002Farxiv.org\u002Fabs\u002F2001.04063)           | 2020 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3EQ6KbP) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)]() | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fhuggingface.co\u002Fdocs\u002Ftransformers\u002Fmodel_doc\u002Fxlmprophetnet) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fgithub\u002FBiswajit7890\u002FADV-DL-NLP-Notebooks\u002Fblob\u002F2258022d0c06599317ef3db3d53ef8d4826fd0c2\u002Fcustom_language_translation_Training_with_XLMProphetNet_.ipynb) |\n| 88    | [XLM-RoBERTa](https:\u002F\u002Farxiv.org\u002Fabs\u002F1911.02116)              | 2020 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3IHnHI3) | 
[![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fwww.youtube.com\u002Fwatch?v=Ot6A3UFY72c&ab_channel=AISuisse) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Ffacebookresearch\u002Fcc_net) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fgithub\u002Fedoost\u002Fpert\u002Fblob\u002F29fc78bc36110ea031083a3e7294ce9135026ee1\u002Fpos_xlmroberta_multi.ipynb) |\n| 89    | [XLSR-Wav2Vec2](https:\u002F\u002Farxiv.org\u002Fabs\u002F2006.13979)            | 2020 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F33qEO0D) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fbit.ly\u002F3DSHm4e) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002FHLasse\u002Fwav2vec_finetune) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fgithub\u002Fkingabzpro\u002FWOLOF-ASR-Wav2Vec2\u002Fblob\u002Fe389abae6887788894795b7fd0171b306e3ca752\u002F3-asr-fine-tune-wolof-gdrive.ipynb) |\n| 90    | [Switch Transformer](https:\u002F\u002Farxiv.org\u002Fabs\u002F2101.03961v1)     | 2021 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3IHgLup) | 
[![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002F2pbvnxdaKaw) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Ftensorflow\u002Fmesh) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fgithub\u002FLoniQin\u002Fenglish-spanish-translation-switch-transformer\u002Fblob\u002Fmain\u002Fenglish_spanish_translation_switch_transformer.ipynb) |\n| 91    | [TNT](https:\u002F\u002Farxiv.org\u002Fabs\u002F2103.00112v3)                    | 2021 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3pRazY7) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002FHWna2c5VXDg) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fhuawei-noah\u002FCV-Backbones\u002Ftree\u002Fmaster\u002Ftnt_pytorch) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fgithub\u002FRishit-dagli\u002FTransformer-in-Transformer\u002Fblob\u002Fmain\u002Fexample\u002Ftnt-example.ipynb) |\n| 92    | [Adaptive Span Transformer](https:\u002F\u002Farxiv.org\u002Fabs\u002F1905.07799v2) | 2021 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F31SYHwT) | 
[![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fbit.ly\u002F3GFNqib) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Ffacebookresearch\u002Fadaptive-span) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fgithub\u002Fprajjwal1\u002Fadaptive_transformer\u002Fblob\u002F8f062a7d5c6573ebdb1aa2b57113db918156b15a\u002Fnbs\u002Fadaptive_train.ipynb) |\n| 93    | [Primer](https:\u002F\u002Farxiv.org\u002Fabs\u002F2109.08668v1)                 | 2021 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3s1eYKD) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002Fze7poOz-5Pw) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fgoogle-research\u002Fgoogle-research\u002Ftree\u002Fmaster\u002Fprimer) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fgithub.com\u002Flucidrains\u002Fx-transformers#relu) |\n| 94    | [Charformer](https:\u002F\u002Farxiv.org\u002Fabs\u002F2106.12672v2)             | 2021 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3GH3tfQ) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002Fdebgj24BAZE) | 
[![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fgoogle-research\u002Fgoogle-research\u002Ftree\u002Fmaster\u002Fcharformer) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fgithub.com\u002Flucidrains\u002Fcharformer-pytorch) |\n| 95    | [MATE](https:\u002F\u002Farxiv.org\u002Fabs\u002F2109.04312v1)                   | 2021 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3lZ37cs) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002FTsTib7b0zqU) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fgoogle-research\u002Ftapas) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fgithub\u002Fgoogle-research\u002Ftapas\u002Fblob\u002Fmaster\u002Fnotebooks\u002Fsqa_predictions.ipynb) |\n| 96    | [Nystromformer](https:\u002F\u002Farxiv.org\u002Fabs\u002F2102.03902v3)          | 2021 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3IIzoy4) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002Fm-zrcmRd7E4) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fmlpen\u002FNystromformer) | [![Open In 
Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fgithub.com\u002Flucidrains\u002Fnystrom-attention) |\n| 97    | [Subformer](https:\u002F\u002Farxiv.org\u002Fabs\u002F2101.00234v3)              | 2021 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3IKod7X) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)]() | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fmachelreid\u002Fsubformer) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)]() |\n| 98    | [ESACL](https:\u002F\u002Farxiv.org\u002Fabs\u002F2108.11992v1)                  | 2021 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F33qph0M) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002FdHHvdubDnYM) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fchz816\u002Fesacl) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)]() |\n| 99    | [PermuteFormer](https:\u002F\u002Farxiv.org\u002Fabs\u002F2109.02377v2)          | 2021 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3pT0ABv) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)]() | 
[![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fcpcp1998\u002Fpermuteformer) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)]() |\n| 100   | [NormFormer](https:\u002F\u002Farxiv.org\u002Fabs\u002F2110.09456v2)             | 2021 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3DSZbQq) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)]() | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fpytorch\u002Ffairseq) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)]() |\n| 101   | [Fastformer](https:\u002F\u002Farxiv.org\u002Fabs\u002F2108.09084v6)             | 2021 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3lZ4nME) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002FqgUegkefocg) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fmicrosoft\u002Ffastformers) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fgithub\u002Fwuch15\u002FFastformer\u002Fblob\u002Fmain\u002FFastformer.ipynb) |\n| 102   | [AutoTinyBERT](https:\u002F\u002Farxiv.org\u002Fabs\u002F2107.13686v1)           | 2021 | 
[![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F31Kfxy5) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)]() | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fhuawei-noah\u002FPretrained-Language-Model) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fgithub.com\u002Fhuawei-noah\u002FPretrained-Language-Model\u002Ftree\u002Fmaster\u002FAutoTinyBERT) |\n| 103   | [EGT](https:\u002F\u002Farxiv.org\u002Fabs\u002F2108.03348v2)                    | 2021 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3rXLWvt) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002F51_K8RDVlXY) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fshamim-hussain\u002Fegt) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)]() |\n| 104   | [Chinese Pre-trained Unbalanced   Transformer](https:\u002F\u002Farxiv.org\u002Fabs\u002F2109.05729v3) | 2021 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3oOI6mr) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)]() | 
[![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Ffastnlp\u002Fcpt) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fgithub.com\u002Ffastnlp\u002FCPT) |\n| 105   | [GANFormer](https:\u002F\u002Farxiv.org\u002Fabs\u002F2103.01209v3)              | 2021 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3dJjZzt) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002FHO-_t0UArd4) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fdorarad\u002Fgansformer) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fgithub\u002FGiorgiaAuroraAdorni\u002Fgansformer-reproducibility-challenge\u002Fblob\u002F83c145d9e706d3814cf0eef7036a8e59c2accb2b\u002Fcolab%20notebooks\u002FReproducibility_model_trainer.ipynb) |\n| 106   | [ClipBERT](https:\u002F\u002Farxiv.org\u002Fabs\u002F2102.06183v1)               | 2021 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3ERUCY6) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002FcBVdz1FjwVM) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fjayleicn\u002FClipBERT) | [![Open In 
Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)]() |\n| 107   | [CodeT5](https:\u002F\u002Farxiv.org\u002Fabs\u002F2109.00859v1)                 | 2021 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3oMJp5t) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)]() | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fsalesforce\u002Fcodet5) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fgithub\u002FDehbaiyor\u002FIDLFall2021Project\u002Fblob\u002Fb100172b4477447db82a5c1c96dcef2349592ae4\u002FBaselines\u002Fcodet5-baseline.ipynb) |\n| 108   | [I-BERT](https:\u002F\u002Fpaperswithcode.com\u002Fmethod\u002Fi-bert)           | 2021 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3yiN521) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)]() | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)]() | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fhuggingface.co\u002Fdocs\u002Ftransformers\u002Fmodel_doc\u002Fibert) |\n| 109   | [ByT5](https:\u002F\u002Farxiv.org\u002Fabs\u002F2105.13626)                     | 2021 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3dLRpxh) | 
[![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002FvEOYfPPu3ik) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fgoogle-research\u002Fbyt5) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fdrive\u002F1rxpI8IlKk-D2crFqi2hdzbTBIezqgsCg?usp=sharing) |\n| 110   | [CANINE](https:\u002F\u002Farxiv.org\u002Fabs\u002F2103.06874)                   | 2021 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3EQym0N) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002FE17qE148aSM) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fgoogle-research\u002Flanguage\u002Ftree\u002Fmaster\u002Flanguage\u002Fcanine) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fgithub.com\u002FNielsRogge\u002FTransformers-Tutorials\u002Fblob\u002Fmaster\u002FCANINE\u002FFine_tune_CANINE_on_IMDb_(movie_review_binary_classification).ipynb) |\n| 111   | [FNet](https:\u002F\u002Farxiv.org\u002Fabs\u002F2105.03824)                     | 2021 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3DR2yrl) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002FJJR3pBl78zw) | 
[![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Frishikksh20\u002FFNet-pytorch) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fgithub\u002Fvishal-burman\u002FPyTorch-Architectures\u002Fblob\u002Fmaster\u002Fmodeling_FNet\u002Ftest_sample_FNet.ipynb) |\n| 112   | [LayoutLMV2](https:\u002F\u002Farxiv.org\u002Fabs\u002F2012.14740)               | 2021 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3dQwpFq) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fbit.ly\u002F3DRodzt) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fmicrosoft\u002Funilm) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fgithub\u002Fjdegange\u002FMultimodalDocumentTransformers\u002Fblob\u002Fcc03caeca7efc1b17789567cc7a0b7e1c8bdac1a\u002FFine_tuning_LayoutLMv2ForTokenClassification_on_CORD.ipynb) |\n| 113   | [LayoutXLM](https:\u002F\u002Farxiv.org\u002Fabs\u002F2104.08836)                | 2021 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3DPjZZ6) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)]() | 
[![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fmicrosoft\u002Funilm\u002Ftree\u002Fmaster\u002Flayoutxlm) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fgithub.com\u002Fhieuthehungry\u002Flayout_xlm_vnm\u002Fblob\u002Fb35c9f13cd9ea75832d39a74587ca84610d8c659\u002Ffine_tuning_layoutxlm_fortokenclassification_on_cord.py) |\n| 114   | [GPT-J](https:\u002F\u002Fhuggingface.co\u002Fdocs\u002Ftransformers\u002Fmodel_doc\u002Fgptj) | 2021 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3EV9WmI) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002FS9FhhhQEqiE) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fkingoflolz\u002Fmesh-transformer-jax) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fgithub\u002FNielsRogge\u002FTransformers-Tutorials\u002Fblob\u002Fmaster\u002FGPT-J-6B\u002FInference_with_GPT_J_6B.ipynb) |\n| 115   | [Hubert](https:\u002F\u002Farxiv.org\u002Fabs\u002F2106.07447)                   | 2021 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3ETLjGU) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002Fp5M7CYZAqfA) | 
[![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fhuseinzol05\u002Fmalaya-speech) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fgithub\u002Fshamik-biswas-rft\u002FSpeech2Text\u002Fblob\u002F8c8663b6cd3dbff557e90a6e813b58b17005a2bf\u002Fnotebooks\u002Fautomatic_transcriptions.ipynb) |\n| 116   | [Perceiver](https:\u002F\u002Farxiv.org\u002Fabs\u002F2107.14795)                | 2021 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3dNUWLE) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002FWJWBq4NZfvY) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fdeepmind\u002Fdeepmind-research\u002Ftree\u002Fmaster\u002Fperceiver) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fgithub\u002FNielsRogge\u002FTransformers-Tutorials\u002Fblob\u002Fmaster\u002FPerceiver\u002FPerceiver_for_masked_language_modeling_and_image_classification.ipynb) |\n| 117   | [RoFormer](https:\u002F\u002Farxiv.org\u002Fpdf\u002F2104.09864v1.pdf)           | 2021 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F31TNbAX) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002FrNG_hpSyZcE) | 
[![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002FZhuiyiTechnology\u002Froformer) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fgithub.com\u002FJunnYu\u002FRoFormer_pytorch) |\n| 118   | [SegFormer](https:\u002F\u002Farxiv.org\u002Fabs\u002F2105.15203)                | 2021 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3ESxzw3) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002FJ0MoRQzZe8U) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002FNVlabs\u002FSegFormer) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fgithub\u002FNielsRogge\u002FTransformers-Tutorials\u002Fblob\u002Fmaster\u002FSegFormer\u002FSegformer_inference_notebook.ipynb) |\n| 119   | [SEW](https:\u002F\u002Farxiv.org\u002Fabs\u002F2109.06870)                      | 2021 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3EQ4n8V) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)]() | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fasappresearch\u002Fsew) | [![Open In 
Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fhuggingface.co\u002Fdocs\u002Ftransformers\u002Fmodel_doc\u002Fsew) |\n| 120   | [SEW-D](https:\u002F\u002Farxiv.org\u002Fabs\u002F2109.06870)                    | 2021 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3dI3iV3) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)]() | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fasappresearch\u002Fsew) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fhuggingface.co\u002Fdocs\u002Ftransformers\u002Fmodel_doc\u002Fsew_d) |\n| 121   | [Speech2Text2](https:\u002F\u002Farxiv.org\u002Fabs\u002F2104.06678)             | 2021 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3dNMGLn) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002FdJAoK5zK36M) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Farxiv.org\u002Fabs\u002F2104.06678) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Farxiv.org\u002Fabs\u002F2104.06678) |\n| 122   | [Splinter](https:\u002F\u002Farxiv.org\u002Fabs\u002F2101.00438)                 | 2021 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3dLX86f) | 
[![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fbit.ly\u002F3oUTyNi) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Foriram\u002Fsplinter) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fgithub\u002FQiwei97\u002FMachine-Learning-Models\u002Fblob\u002F67c713c411ec824a2dfcb0d75f1185d2d1b6e354\u002FNLP%20Projects\u002FQuestion%20Answering\u002FSplinter%20TPU.ipynb) |\n| 123   | [TrOCR](https:\u002F\u002Farxiv.org\u002Fabs\u002F2109.10282)                    | 2021 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F30mlLmR) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)]() | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fmicrosoft\u002Funilm\u002Ftree\u002Fmaster\u002Ftrocr) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fgithub\u002FNielsRogge\u002FTransformers-Tutorials\u002Fblob\u002Fmaster\u002FTrOCR\u002FInference_with_TrOCR_%2B_Gradio_demo.ipynb) |\n| 124   | [UniSpeech](https:\u002F\u002Farxiv.org\u002Fabs\u002F2101.07597)                | 2021 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3rZ5Aaq) | 
[![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002FhS42xD3O55E) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fmicrosoft\u002FUniSpeech) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fhuggingface.co\u002Fdocs\u002Ftransformers\u002Fmodel_doc\u002Funispeech) |\n| 125   | [UniSpeech-SAT](https:\u002F\u002Farxiv.org\u002Fabs\u002F2110.05752)            | 2021 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3rY9wZ1) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002Fl4t_ENqo5rE) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fmicrosoft\u002Funispeech) | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fhuggingface.co\u002Fdocs\u002Ftransformers\u002Fmodel_doc\u002Funispeech_sat) |\n| 126   | [MarianMT](https:\u002F\u002Fhuggingface.co\u002Fdocs\u002Ftransformers\u002Fmodel_doc\u002Fmarian) | -    |                                                              |                                                              | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)]() | [![Open In Colab](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fhuggingface.co\u002Fdocs\u002Ftransformers\u002Fmodel_doc\u002Fmarian) |\n\n---\n\n#### Instruction\n\n* All blogs have links and 
some links point to blogs in other languages such as Chinese, Korean, etc. For these, please use [Google Translator Page Convert](https:\u002F\u002Fchrome.google.com\u002Fwebstore\u002Fdetail\u002Fgoogle-translate\u002Faapbdbdomjkkjkaonfhkkikfgjllcleb?hl=en).\n\n---\n\n#### How to Contribute\n\n---\n\nIf you want to contribute to this project, please send us an email: ashishpatel.ce.2011@gmail.com . \n\n🙏🙏Special Thanks to [**Komal Lamba**](https:\u002F\u002Fgithub.com\u002Fkomal11lamba) for contributing.\n\n---\n\nCopyright for source code belongs to the original author(s). However, under fair use you are encouraged to fork and contribute minor corrections and updates for the benefit of the reader(s).\n\n---\n\n**_Thanks for  Reading ...!!!_**\n\n---\n\n","# Transformer 模型宝藏精选集\n\n![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8dc10b5ba7f5.jpg)\n\n![fw.jpg](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_f81f9ff72b3e.jpg)\n\n---\n\n###  🧑‍💻👩‍💻所有自然语言处理（NLP）深度学习算法及代码合集 🧑‍💻👩‍💻![Jupyter Notebook](https:\u002F\u002Fimg.shields.io\u002Fbadge\u002Fjupyter-%23FA0F00.svg?style=for-badge&logo=jupyter&logoColor=white)\n\n---\n\n| 序号 | 算法名称                                               | 年份 | 博客                                                         | 视频                                                        | 官方仓库                                                | 代码                                                         |\n| ----- | ------------------------------------------------------------ | ---- | ------------------------------------------------------------ | ------------------------------------------------------------ | ------------------------------------------------------------ | ------------------------------------------------------------ |\n| 1     | [GPT-Neo](https:\u002F\u002Fgithub.com\u002FEleutherAI\u002Fgpt-neo)             | 2021 | 
[![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3rYanJk) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002F6MI0f6YjJIk) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002FEleutherAI\u002Fgpt-neo) | [![在 Colab 中打开](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fgithub\u002FEleutherAI\u002FGPTNeo\u002Fblob\u002Fmaster\u002FGPTNeo_example_notebook.ipynb) |\n| 2     | [Transformer](https:\u002F\u002Farxiv.org\u002Fabs\u002F1706.03762v5)            | 2017 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3DNsrIp) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002FiDulhoQ2pro) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Ftensorflow\u002Fmodels\u002Ftree\u002Fmaster\u002Fofficial\u002Fnlp\u002Ftransformer) | [![在 Colab 中打开](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fgithub\u002Fbentrevett\u002Fpytorch-seq2seq\u002Fblob\u002Fmaster\u002F6%20-%20Attention%20is%20All%20You%20Need.ipynb) |\n| 3     | [BERT](https:\u002F\u002Farxiv.org\u002Fabs\u002F1810.04805v2)                   | 2018 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3pPV8PS) | 
[![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002F7kLi8u2dJz0) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fgoogle-research\u002Fbert) | [![在 Colab 中打开](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fgithub\u002FNielsRogge\u002FTransformers-Tutorials\u002Fblob\u002Fmaster\u002FBERT\u002FCustom_Named_Entity_Recognition_with_BERT_only_first_wordpiece.ipynb) |\n| 4     | [GPT](https:\u002F\u002Fs3-us-west-2.amazonaws.com\u002Fopenai-assets\u002Fresearch-covers\u002Flanguage-unsupervised\u002Flanguage_understanding_paper.pdf) | 2018 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3ENPuEn) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002F9ebPNEHRwXU) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fhuggingface\u002Ftransformers) | [![在 Colab 中打开](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fgithub\u002Fkeras-team\u002Fkeras-io\u002Fblob\u002Fmaster\u002Fexamples\u002Fgenerative\u002Fipynb\u002Ftext_generation_with_miniature_gpt.ipynb) |\n| 5     | [Universal Transformer](https:\u002F\u002Farxiv.org\u002Fabs\u002F1807.03819v3)  | 2018 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3lRi6VG) | 
[![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)]() | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Ftensorflow\u002Ftensor2tensor) | [![在 Colab 中打开](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fgithub\u002Ftensorflow\u002Ftensor2tensor\u002Fblob\u002Fmaster\u002Ftensor2tensor\u002Fnotebooks\u002Fhello_t2t.ipynb) |\n| 6     | [T-D](https:\u002F\u002Farxiv.org\u002Fabs\u002F1801.10198v1)                    | 2018 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3F17Ba5) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002F__ALQCud-iA) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Ftensorflow\u002Ftensor2tensor) | [![在 Colab 中打开](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fgithub\u002Ftensorflow\u002Ftensor2tensor\u002Fblob\u002Fmaster\u002Ftensor2tensor\u002Fnotebooks\u002Fhello_t2t.ipynb) |\n| 7     | [GPT-2](https:\u002F\u002Fd4mucfpksywv.cloudfront.net\u002Fbetter-language-models\u002Flanguage-models.pdf) | 2019 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3rXapBi) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002FX-B3nAN7YRM) | 
[![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fopenai\u002Fgpt-2) | [![在 Colab 中打开](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fgithub\u002Fhuggingface\u002Fblog\u002Fblob\u002Fmaster\u002Fnotebooks\u002F02_how_to_generate.ipynb) |\n| 8     | [T5](https:\u002F\u002Farxiv.org\u002Fabs\u002F1910.10683v3)                     | 2019 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3yjbrZf) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002FjgKj-7v2UYU) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fgoogle-research\u002Ftext-to-text-transfer-transformer) | [![在 Colab 中打开](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fgithub\u002FNielsRogge\u002FTransformers-Tutorials\u002Fblob\u002Fmaster\u002FT5\u002FFine_tune_CodeT5_for_generating_docstrings_from_Ruby_code.ipynb) |\n| 9     | [BART](https:\u002F\u002Farxiv.org\u002Fabs\u002F1910.13461v1)                   | 2019 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3yead1D) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002FXz4fiQNmGSA) | 
[![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Ffacebookresearch\u002FGENRE) | [![在 Colab 中打开](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fgithub\u002Fmrm8488\u002Fshared_colab_notebooks\u002Fblob\u002Fmaster\u002FBART_with_JS_UI.ipynb) |\n| 10    | [XLNet](https:\u002F\u002Farxiv.org\u002Fabs\u002F1906.08237v2)                  | 2019 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3EGEHM5) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002F8J8KkuncAmY) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fzihangdai\u002Fxlnet) | [![在 Colab 中打开](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fdrive\u002F1YXojI6USFGV3498Pygllv0z8vTMVIiEt) |\n| 11    | [ALBERT](https:\u002F\u002Farxiv.org\u002Fabs\u002F1909.11942v6)                 | 2019 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3lW9L34) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002FLwtj2yUAMgI) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fgoogle-research\u002FALBERT) | [![在 Colab 
中打开](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fgithub\u002Fgoogle-research\u002Falbert\u002Fblob\u002Fmaster\u002Falbert_glue_fine_tuning_tutorial.ipynb) |\n| 12    | [Distil-BERT](https:\u002F\u002Farxiv.org\u002Fabs\u002F1910.01108v4)            | 2019 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3GPQKHN) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002FcCs8exFrGE8) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)]() | [![在 Colab 中打开](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)]() |\n| 13    | [Transformer-XL](https:\u002F\u002Farxiv.org\u002Fabs\u002F1901.02860v3)         | 2019 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3lW6qkC) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002FmqsRZAJav70) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fkimiyoung\u002Ftransformer-xl) | [![在 Colab 中打开](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fgithub\u002Flab-ml\u002Fnn\u002Fblob\u002Fmaster\u002Flabml_nn\u002Ftransformers\u002Fxl\u002Fexperiment.ipynb) |\n| 14    | [XLM](https:\u002F\u002Farxiv.org\u002Fabs\u002F1901.07291v1)                    | 2019 | 
[![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F31M5BDH) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002FcaZLVcJqsqo) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Ffacebookresearch\u002FXLM) | [![在 Colab 中打开](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fgithub\u002FTikquuss\u002Fmeta_XLM\u002Fblob\u002Fmaster\u002Fnotebooks\u002Fdemo\u002Ftuto.ipynb) |\n| 15    | [ViLBERT](https:\u002F\u002Farxiv.org\u002Fabs\u002F1908.02265v1)                | 2019 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F31M5KqJ) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002Fdd7nE4nbxN0) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Ffacebookresearch\u002Fvilbert-multi-task\u002F) | [![在 Colab 中打开](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fgithub\u002Ffacebookresearch\u002Fvilbert-multi-task\u002Fblob\u002F9d645085b54fac6a781257133edabefdfb23e547\u002Fdemo.ipynb) |\n| 16    | [Sparse Transformer](https:\u002F\u002Farxiv.org\u002Fabs\u002F1904.10509v1)     | 2019 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3ELosND) | 
[![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002FjaqjcHmCBfY) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fopenai\u002Fsparse_attention) | [![在 Colab 中打开](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fgithub.com\u002Fptillet\u002Ftorch-blocksparse\u002Fblob\u002Fmaster\u002Fexamples\u002Fsimple.py) |\n| 17    | [Levenshtein Transformer](https:\u002F\u002Farxiv.org\u002Fabs\u002F1905.11006v2) | 2019 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3rUU4wQ) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002FFtUbMG3rlFs) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fpytorch\u002Ffairseq) | [![在 Colab 中打开](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)]() |\n| 18    | [CTRL](https:\u002F\u002Farxiv.org\u002Fabs\u002F1909.05858v2)                   | 2019 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F33pJRhX) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002Fq5zw2Wh4Rdo) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fsalesforce\u002Fctrl) | [![在 Colab 
中打开](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fdrive\u002F1nDh3ayRPJGK5ciPO2D3TFkYZFqclBWHY) |\n| 19    | [VideoBERT](https:\u002F\u002Farxiv.org\u002Fabs\u002F1904.01766v2)              | 2019 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F31PHkN2) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002FEkuyLsJX4QM) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002FMDSKUL\u002FMasterProject) | [![在 Colab 中打开](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fgithub.com\u002Fammesatyajit\u002FVideoBERT) |\n| 20    | [Compressive Transformer](https:\u002F\u002Farxiv.org\u002Fabs\u002F1911.05507v1) | 2019 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3rX1q2L) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002F0TMKCQiT1T0) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fdeepmind\u002Fpg19) | [![在 Colab 中打开](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fgithub.com\u002Flucidrains\u002Fcompressive-transformer-pytorch) |\n| 21    | [CuBERT](https:\u002F\u002Farxiv.org\u002Fabs\u002F2001.00059v3)                 | 2019 | 
[![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3lXcxVH) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002FbCPeg0Tp64s) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fgoogle-research\u002Fgoogle-research\u002Ftree\u002Fmaster\u002Fcubert) | [![在 Colab 中打开](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fgithub\u002Fai-center-kth\u002FcuBERT-source-code-clustering\u002Fblob\u002Fmain\u002Fsrc\u002Fevaluation.ipynb) |\n| 22    | [BP-Transformer](https:\u002F\u002Farxiv.org\u002Fabs\u002F1911.04070v1)         | 2019 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3yuzqFj) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)]() | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fyzh119\u002FBPT) | [![在 Colab 中打开](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)]() |\n| 23    | [Adaptively Sparse Transformer](https:\u002F\u002Farxiv.org\u002Fabs\u002F1909.00015v2) | 2019 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3lXLbyG) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002F_pYxa50HTBw) | 
[![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fdeep-spin\u002Fentmax) | [![在 Colab 中打开](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fgithub\u002Fprajjwal1\u002Fadaptive_transformer\u002Fblob\u002F8f062a7d5c6573ebdb1aa2b57113db918156b15a\u002Fnbs\u002Fadaptive_train.ipynb) |\n| 24    | [Sandwich Transformer](https:\u002F\u002Farxiv.org\u002Fabs\u002F1911.03864v2)   | 2019 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F31V686t) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002FEM8xFAjtZUQ) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fofirpress\u002Fsandwich_transformer) | [![在 Colab 中打开](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fgithub.com\u002Flucidrains\u002Fx-transformers) |\n| 25    | [FSMT](https:\u002F\u002Farxiv.org\u002Fabs\u002F1907.06616)                     | 2019 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3oIFarp) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)]() | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fpytorch\u002Ffairseq\u002Ftree\u002Fmain\u002Fexamples\u002Fwmt19) | [![在 Colab 
中打开](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fhuggingface.co\u002Ftransformers\u002Fv3.5.1\u002Fmodel_doc\u002Ffsmt.html) |\n| 26    | [LXMERT](https:\u002F\u002Farxiv.org\u002Fabs\u002F1908.07490)                   | 2019 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3oJq19i) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)]() | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fairsplay\u002Flxmert) | [![在 Colab 中打开](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fdrive\u002F18TyuMfZYlgQ_nXo-tr8LCnzUaoX0KS-h?usp=sharing) |\n| 27    | [VisualBERT](https:\u002F\u002Farxiv.org\u002Fpdf\u002F1908.03557)               | 2019 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3s0AgIq) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002FLhi1UFsXvpk) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fuclanlp\u002Fvisualbert) | [![在 Colab 中打开](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fgithub\u002Fuclanlp\u002Fvisualbert\u002Fblob\u002Fe49b61906dff12f1b2992226ae84c538fcf438e4\u002Funsupervised_visualbert\u002Fdata\u002Fnlvr2\u002Fnlvr\u002Fnlvr2\u002FNLVR2BiasAnalysis.ipynb) |\n| 28    | 
[GPT-3](https:\u002F\u002Farxiv.org\u002Fabs\u002F2005.14165v4)                  | 2020 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3oIFwhJ) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002FSboKeK6FFHQ) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fopenai\u002Fgpt-3) | [![在 Colab 中打开](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fgithub\u002Frafajak\u002Fgpt3_examples\u002Fblob\u002Fmaster\u002FGPT3_search_example.ipynb) |\n| 29    | [ELECTRA](https:\u002F\u002Farxiv.org\u002Fabs\u002F2003.10555v1)                | 2020 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3lUZGDy) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002Fp9c7SoD4AMc) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fgoogle-research\u002Felectra) | [![在 Colab 中打开](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fdrive\u002F1DiOwhRjQbtYRgFWG7e3dybcXJsZcu86l) |\n| 30    | [Electric](https:\u002F\u002Farxiv.org\u002Fabs\u002F2012.08561v1)               | 2020 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F31SfM9E) | 
[![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)]() | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fgoogle-research\u002Felectra) | [![在 Colab 中打开](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)]() |\n| 31    | [LongFormer](https:\u002F\u002Farxiv.org\u002Fabs\u002F2004.05150v2)             | 2020 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3oJ03mh) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002F_8KNb5iqblE) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fallenai\u002Flongformer) | [![在 Colab 中打开](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fgithub\u002Fpatil-suraj\u002FNotebooks\u002Fblob\u002Fmaster\u002Flongformer_qa_training.ipynb) |\n| 32    | [mBART](https:\u002F\u002Farxiv.org\u002Fabs\u002F2001.08210v2)                  | 2020 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3EPC0Ii) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002FoO7k5lH8Oe8) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fpytorch\u002Ffairseq\u002Ftree\u002Fmaster\u002Fexamples\u002Fmbart) | [![在 Colab 
中打开](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fgithub\u002Fsdhilip200\u002FMachine-Translation-using-mBART-50-and-Hugging-Face\u002Fblob\u002Fmain\u002FMachine_Translation.ipynb) |\n| 33    | [Performer](https:\u002F\u002Farxiv.org\u002Fabs\u002F2009.14794v3)              | 2020 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3pLxvYW) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002FxJrKIPwVwGM) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fgoogle-research\u002Fgoogle-research) | [![在 Colab 中打开](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fdrive\u002F1ICW0DpXfUuVYsnNkt1DHwUyyTduHHvE3?usp=sharing) |\n| 34    | [ETC](https:\u002F\u002Farxiv.org\u002Fabs\u002F2004.08483v5)                    | 2020 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3rWIy3W) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002FTyydOhj28A4) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fgoogle-research\u002Fgoogle-research\u002Ftree\u002Fmaster\u002Fetcmodel) | [![在 Colab 中打开](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)]() |\n| 35    | [CodeBERT](https:\u002F\u002Farxiv.org\u002Fabs\u002F2002.08155v4)               | 2020 | 
[![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3pPuIhc) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002FYmAXluUDPPI) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https:\u002F\u002Fgithub.com\u002Fmicrosoft\u002FCodeBERT) | [![在 Colab 中打开](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fgithub\u002Fgraykode\u002Fcommit-autosuggestions\u002Fblob\u002F579d7a34f3ebb735d2a9f13afc74eeb66c0d7427\u002Fcommit_autosuggestions.ipynb) |\n| 36    | [mT5](https:\u002F\u002Farxiv.org\u002Fabs\u002F2010.11934v3)                    | 2020 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3DJ76jh) | [![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)]() | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)]() | [![在 Colab 中打开](https:\u002F\u002Fcolab.research.google.com\u002Fassets\u002Fcolab-badge.svg)](https:\u002F\u002Fcolab.research.google.com\u002Fgithub\u002Fejmejm\u002Fmultilingual-nmt-mt5\u002Fblob\u002Fmain\u002Fnmt_full_version.ipynb) |\n| 37    | [Reformer](https:\u002F\u002Farxiv.org\u002Fabs\u002F2001.04451v2)               | 2020 | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_40c0141dc69a.jpg)](https:\u002F\u002Fbit.ly\u002F3pPSTMn) | 
[![Youtube](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_8aa0e5cb29d1.jpg)](https:\u002F\u002Fyoutu.be\u002Fi4H0kjxrias) | [![](https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_readme_75b99b590e6f.jpg)](https\n\n#### 说明\n\n* 所有博客均包含链接，部分链接指向的语言并非英文（例如中文、韩语等）。为此，请使用 [Google 翻译页面转换](https:\u002F\u002Fchrome.google.com\u002Fwebstore\u002Fdetail\u002Fgoogle-translate\u002Faapbdbdomjkkjkaonfhkkikfgjllcleb?hl=en)。\n\n---\n\n#### 如何贡献\n\n---\n\n如果您希望为本项目做出贡献，请发送邮件至：ashishpatel.ce.2011@gmail.com。\n\n🙏🙏特别感谢 [**Komal Lamba**](https:\u002F\u002Fgithub.com\u002Fkomal11lamba) 的贡献。\n\n---\n\n源代码的版权归属于原作者。然而，依据合理使用原则，我们鼓励您进行 Fork（代码分叉）并贡献细微的修正与更新，以惠及读者。\n\n---\n\n**_感谢您的阅读 ...!!!_**","# Treasure-of-Transformers 快速上手指南\n\n**Treasure-of-Transformers** 是一个精选的 NLP 深度学习算法资源集合库，收录了从 Transformer 到 GPT、BERT 等主流模型的官方代码、教程博客及视频链接。本工具旨在帮助开发者快速查找并复现相关模型。\n\n## 环境准备\n\n由于该仓库主要提供资源索引和 Colab 笔记本链接，无需复杂的本地环境即可开始体验。若需运行本地代码，建议准备以下环境：\n\n- **操作系统**: Windows \u002F macOS \u002F Linux\n- **版本控制**: Git\n- **编程语言**: Python 3.7+ (用于克隆具体模型仓库后运行)\n- **硬件**: \n  - 推荐使用 **Google Colab** (免费 GPU 支持，无需本地配置)。\n  - 本地训练建议配备 NVIDIA GPU (CUDA 环境)。\n- **网络**: 访问 GitHub 及 Colab 的网络连接。\n\n## 安装步骤\n\n本仓库为资源索引库，通过 Git 克隆获取最新资源列表。\n\n1. **克隆仓库**\n   ```bash\n   git clone https:\u002F\u002Fgithub.com\u002Fashishpatel26\u002FTreasure-of-Transformers.git\n   ```\n   > 💡 **国内加速提示**: 若克隆速度较慢，建议使用国内镜像服务（如 `git clone https:\u002F\u002Fhub.fastgit.org\u002Fashishpatel26\u002FTreasure-of-Transformers.git`）。\n\n2. **查看资源**\n   进入目录后，直接打开 `README.md` 文件查看算法列表。\n\n## 基本使用\n\n本工具的核心价值在于其提供的 **Colab Notebook** 链接，这是最快速的验证方式。\n\n### 1. 选择模型\n在 `README.md` 表格中找到感兴趣的算法（例如 `BERT` 或 `GPT-2`）。\n\n### 2. 一键运行 (推荐)\n点击表格中对应的 **\"Open In Colab\"** 徽章链接。\n- 示例链接格式：`https:\u002F\u002Fcolab.research.google.com\u002Fgithub\u002F...`\n- 这将直接在浏览器中打开 Jupyter Notebook，自动挂载 GPU 并加载依赖。\n\n### 3. 本地复现\n若需在本地运行：\n1. 
点击表格中的 **\"Official Repo\"** 链接跳转到模型官方仓库。\n2. 参考官方文档安装依赖。\n3. 示例命令（以通用 Transformers 库为例）：\n   ```bash\n   pip install transformers torch\n   ```\n\n### 4. 学习资源\n- **Blog**: 点击博客图标链接阅读技术解析。\n- **Video**: 点击 YouTube 图标观看讲解视频。\n\n通过以上步骤，您可以快速浏览并实践最新的 Transformer 系列模型。","某初创公司的算法工程师小李需要在三天内完成一个医疗文本实体识别的项目原型，急需寻找成熟且易上手的 Transformer 模型方案。\n\n### 没有 Treasure-of-Transformers 时\n- 需要分别去 GitHub、arXiv 和各类技术博客搜索不同模型的论文与代码，信息极度分散导致查找效率低下。\n- 找到的官方仓库往往缺少详细的环境配置说明，本地运行时常因依赖冲突报错，调试陷入困境。\n- 缺乏直观的视频讲解或配套教程笔记，理解复杂的注意力机制原理需要反复阅读晦涩的英文文档。\n\n### 使用 Treasure-of-Transformers 后\n- 直接在资源库中找到 BERT 相关条目，一次性获取了论文、视频教程及官方仓库的完整链接，不再四处翻找。\n- 点击 Colab Notebook 标签即可在云端一键运行示例代码，完全跳过了繁琐的本地环境搭建与依赖安装过程。\n- 结合配套的博客文章解析，迅速掌握了基于 BERT 进行自定义命名实体识别的具体实现细节与调参技巧。\n\nTreasure-of-Transformers 通过整合全链路学习资源，极大降低了 NLP 模型复现的时间门槛与技术难度。","https:\u002F\u002Foss.gittoolsai.com\u002Fimages\u002Fashishpatel26_Treasure-of-Transformers_86cbc252.png","ashishpatel26","Ashish Patel","https:\u002F\u002Foss.gittoolsai.com\u002Favatars\u002Fashishpatel26_9e4e7549.jpg","AI Researcher & Principal Architect AI\u002FML & Data Science at Oracle\r\n| xIBMers | Rank 3 Kaggle Kernel Master","Oracle | xIBMers","Ahmedabad","shriganesh.patel@gmail.com",null,"https:\u002F\u002Fmedium.com\u002Fml-research-lab","https:\u002F\u002Fgithub.com\u002Fashishpatel26",[86],{"name":87,"color":88,"percentage":89},"Jupyter Notebook","#DA5B0B",100,1130,230,"2026-03-30T15:45:46","MIT",1,"未说明",{"notes":97,"python":95,"dependencies":98},"该仓库为 NLP 深度学习算法集合索引，非独立可运行软件包。具体运行环境需求取决于所选用的子项目（如 BERT、GPT 等），通常涉及 PyTorch 或 TensorFlow 框架及 HuggingFace Transformers 库。部分大型模型训练或推理建议配备 GPU。建议参考各子项目官方文档配置环境，或使用 Jupyter Notebook\u002FColab 
运行示例代码。",[99,100,101,102],"transformers","torch","tensorflow","jupyter",[13,26,55],[105,106,107,108,101,109,110,111,112,113,114,115,116,117,118,119,120,121,122],"transformer","python","nlp","natural-language-processing","pytorch","speech-recognition","seq2seq","pretrained-models","language-models","natural-language-generation","nlp-library","bert","natural-language-understanding","language-model","pytorch-transformers","model-hub","jax","awesome",4,"2026-03-27T02:49:30.150509","2026-04-06T07:26:08.694766",[127],{"id":128,"question_zh":129,"answer_zh":130,"source_url":131},2785,"XLM-Roberta 教程中的 YouTube 视频链接失效了怎么办？","项目维护者已在评论中确认链接已更新（Updated）。请刷新页面或查看仓库最新内容以获取正确的视频地址。","https:\u002F\u002Fgithub.com\u002Fashishpatel26\u002FTreasure-of-Transformers\u002Fissues\u002F1",[]]