{"id":5458,"name":"llms-from-scratch","description":"Implement a ChatGPT-like LLM in PyTorch from scratch, step by step","url":"https://github.com/rasbt/llms-from-scratch","last_synced_at":"2025-09-04T18:43:52.729Z","repository":{"id":183291756,"uuid":"669879380","full_name":"rasbt/LLMs-from-scratch","owner":"rasbt","description":"Implement a ChatGPT-like LLM in PyTorch from scratch, step by step","archived":false,"fork":false,"pushed_at":"2025-08-31T16:46:37.000Z","size":14578,"stargazers_count":68384,"open_issues_count":4,"forks_count":9648,"subscribers_count":614,"default_branch":"main","last_synced_at":"2025-08-31T18:21:12.732Z","etag":null,"topics":["ai","artificial-intelligence","chatgpt","deep-learning","from-scratch","gpt","language-model","large-language-models","llm","machine-learning","python","pytorch","transformer"],"latest_commit_sha":null,"homepage":"https://amzn.to/4fqvn0D","language":"Jupyter Notebook","has_issues":true,"has_wiki":null,"has_pages":null,"mirror_url":null,"source_name":null,"license":"other","status":null,"scm":"git","pull_requests_enabled":true,"icon_url":"https://github.com/rasbt.png","metadata":{"files":{"readme":"README.md","changelog":null,"contributing":null,"funding":null,"license":"LICENSE.txt","code_of_conduct":null,"threat_model":null,"audit":null,"citation":"CITATION.cff","codeowners":null,"security":null,"support":null,"governance":null,"roadmap":null,"authors":null,"dei":null,"publiccode":null,"codemeta":null,"zenodo":null,"notice":null,"maintainers":null,"copyright":null,"agents":null,"dco":null,"cla":null}},"created_at":"2023-07-23T18:15:57.000Z","updated_at":"2025-08-31T18:14:44.000Z","dependencies_parsed_at":"2023-07-23T20:36:44.281Z","dependency_job_id":"b17f8409-8f4f-4326-b663-9473161619f7","html_url":"https://github.com/rasbt/LLMs-from-scratch","commit_stats":{"total_commits":647,"total_committers":28,"mean_commits":"23.107142857142858","dds":"0.15455950540958274","last_synced_commit":"1f61aeb7c4396b12e75f7994de0657d257329b0b"},"previous_names":["rasbt/llms-from-scratch"],"tags_count":0,"template":false,"template_full_name":null,"purl":"pkg:github/rasbt/LLMs-from-scratch","repository_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/rasbt%2FLLMs-from-scratch","tags_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/rasbt%2FLLMs-from-scratch/tags","releases_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/rasbt%2FLLMs-from-scratch/releases","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/rasbt%2FLLMs-from-scratch/manifests","owner_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners/rasbt","download_url":"https://codeload.github.com/rasbt/LLMs-from-scratch/tar.gz/refs/heads/main","sbom_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/rasbt%2FLLMs-from-scratch/sbom","scorecard":null,"host":{"name":"GitHub","url":"https://github.com","kind":"github","repositories_count":273656333,"owners_count":25145000,"icon_url":"https://github.com/github.png","version":null,"created_at":"2022-05-30T11:31:42.601Z","updated_at":"2022-07-04T15:15:14.044Z","status":"online","status_checked_at":"2025-09-04T02:00:08.968Z","response_time":61,"last_error":null,"robots_txt_status":"success","robots_txt_updated_at":"2025-07-24T06:49:26.215Z","robots_txt_url":"https://github.com/robots.txt","online":true,"can_crawl_api":true,"host_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub","repositories_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories","repository_names_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repository_names","owners_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners"}},"owner":{"login":"rasbt","name":"Sebastian Raschka","uuid":"5618407","kind":"user","description":"Machine Learning and AI researcher \u0026 currently research engineer at a startup","email":"","website":"https://magazine.sebastianraschka.com","location":"Madison, WI","twitter":"rasbt","company":"@Lightning-AI , University of Wisconsin-Madison","icon_url":"https://avatars.githubusercontent.com/u/5618407?u=fb6135afa4c7095d0f94c4c0e0eee37d1979a764\u0026v=4","repositories_count":136,"last_synced_at":"2024-05-14T00:04:50.518Z","metadata":{"has_sponsors_listing":false},"html_url":"https://github.com/rasbt","funding_links":[],"total_stars":85770,"followers":21080,"following":34,"created_at":"2022-11-02T16:34:58.132Z","updated_at":"2024-05-14T00:05:08.895Z","owner_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners/rasbt","repositories_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners/rasbt/repositories"},"packages":[],"commits":{"id":1673581,"full_name":"rasbt/LLMs-from-scratch","default_branch":"main","committers":[{"name":"rasbt","email":"mail@sebastianraschka.com","login":"rasbt","count":646},{"name":"Daniel Kleine","email":"53251018+d-kleine","login":"d-kleine","count":59},{"name":"Intelligence-Manifesto","email":"155522535+Intelligence-Manifesto","login":"Intelligence-Manifesto","count":9},{"name":"TITC","email":"35098797+TITC","login":"TITC","count":7},{"name":"Rayed Bin Wahed","email":"rayed@therapservices.net","login":"rayed-therap","count":6},{"name":"casinca","email":"47400729+casinca","login":"casinca","count":4},{"name":"Ikko Eltociear Ashimine","email":"eltociear@gmail.com","login":"eltociear","count":3},{"name":"Jinge Wang","email":"wjg172184@163.com","login":"jingedawang","count":3},{"name":"Xiaotian Ma","email":"44010854+xiaotian0328","login":"xiaotian0328","count":2},{"name":"Suman Debnath","email":"56056673+debnsuma","login":"debnsuma","count":2},{"name":"Pietro Monticone","email":"38562595+pitmonticone","login":"pitmonticone","count":2},{"name":"Kasen","email":"18170166+imkasen","login":"imkasen","count":2},{"name":"Jeroen Van Goey","email":"jeroen.vangoey@gmail.com","login":"BioGeek","count":2},{"name":"Henry Shi","email":"henrythe9th@gmail.com","login":"henrythe9th","count":2},{"name":"Greg Gandenberger","email":"ggandenberger@shoprunner.com","login":"gsganden","count":2},{"name":"Austin Welch","email":"austinmw","login":"austinmw","count":1},{"name":"Eric Berg","email":"ehberg@gmail.com","login":"ehberg","count":1},{"name":"Eric Thomson","email":"thomson.eric@gmail.com","login":"EricThomson","count":1},{"name":"DrCesar","email":"developer@drcesar.tech","login":null,"count":1},{"name":"Sebastian R","email":"Author@Sebastian-Air.lan","login":null,"count":1},{"name":"Kostyantyn Borysenko","email":"kostya.borysenko@gmail.com","login":null,"count":1},{"name":"rvaneijk","email":"rob@blaeu.com","login":"rvaneijk","count":1},{"name":"ridhachahed","email":"31919686+ridhachahed","login":"ridhachahed","count":1},{"name":"joel-foo","email":"joelfootaimeng@gmail.com","login":"joel-foo","count":1},{"name":"Xiangzhuang Shen","email":"datahonor@gmail.com","login":"shenxiangzhuang","count":1},{"name":"Victor Skvortsov","email":"vds003@gmail.com","login":"r4victor","count":1},{"name":"Tim Hopper","email":"tdhopper","login":"tdhopper","count":1},{"name":"Thanh Tran","email":"thanh.ptit.96@gmail.com","login":"thanhtcptit","count":1},{"name":"Tao Qian","email":"taoxqian@gmail.com","login":"tao-qian","count":1},{"name":"SSebo","email":"ssebo.zzz@gmail.com","login":"SSebo","count":1},{"name":"ROHAN WINSOR","email":"61073765+rohanwinsor","login":"rohanwinsor","count":1},{"name":"QS","email":"41225783+Mike-7777777","login":"Mike-7777777","count":1},{"name":"PRASHANTH REDDY NIMMAKAYALA","email":"nprashanthreddy@outlook.com","login":"NPrashanthReddy","count":1},{"name":"Mingyuan Xu","email":"mix16@pitt.edu","login":"mix16atpitt","count":1},{"name":"Megabyte","email":"NyabutiM@protonmail.com","login":"Shuyib","count":1},{"name":"Matthew Feickert","email":"matthew.feickert@cern.ch","login":"matthewfeickert","count":1},{"name":"Kumar Utsav","email":"krum.utsav@gmail.com","login":"kuutsav","count":1},{"name":"Jeff Hammerbacher","email":"jeff.hammerbacher@gmail.com","login":"hammer","count":1},{"name":"James Holcombe","email":"jameslholcombe@gmail.com","login":"jameslholcombe","count":1},{"name":"speed","email":"69028964+speed1313","login":"speed1313","count":1},{"name":"taihaozesong","email":"taihaozesong@gmail.com","login":"taihaozesong","count":1},{"name":"Gustavo Monti","email":"gustavomr","login":"gustavomr","count":1}],"total_commits":778,"total_committers":42,"total_bot_commits":0,"total_bot_committers":0,"mean_commits":18.523809523809526,"dds":0.16966580976863754,"past_year_committers":[{"name":"Sebastian Raschka","email":"mail@sebastianraschka.com","login":"rasbt","count":330},{"name":"Daniel Kleine","email":"53251018+d-kleine","login":"d-kleine","count":40},{"name":"TITC","email":"35098797+TITC","login":"TITC","count":7},{"name":"casinca","email":"47400729+casinca","login":"casinca","count":4},{"name":"Jinge Wang","email":"wjg172184@163.com","login":"jingedawang","count":3},{"name":"Henry Shi","email":"henrythe9th@gmail.com","login":"henrythe9th","count":2},{"name":"Jeroen Van Goey","email":"jeroen.vangoey@gmail.com","login":"BioGeek","count":2},{"name":"Kasen","email":"18170166+imkasen","login":"imkasen","count":2},{"name":"Greg Gandenberger","email":"ggandenberger@shoprunner.com","login":"gsganden","count":2},{"name":"Kostyantyn Borysenko","email":"kostya.borysenko@gmail.com","login":null,"count":1},{"name":"Austin Welch","email":"austinmw","login":"austinmw","count":1},{"name":"Eric Thomson","email":"thomson.eric@gmail.com","login":"EricThomson","count":1},{"name":"Gustavo Monti","email":"gustavomr","login":"gustavomr","count":1},{"name":"Kumar Utsav","email":"krum.utsav@gmail.com","login":"kuutsav","count":1},{"name":"Matthew Feickert","email":"matthew.feickert@cern.ch","login":"matthewfeickert","count":1},{"name":"Mingyuan Xu","email":"mix16@pitt.edu","login":"mix16atpitt","count":1},{"name":"PRASHANTH REDDY NIMMAKAYALA","email":"nprashanthreddy@outlook.com","login":"NPrashanthReddy","count":1},{"name":"QS","email":"41225783+Mike-7777777","login":"Mike-7777777","count":1},{"name":"ROHAN WINSOR","email":"61073765+rohanwinsor","login":"rohanwinsor","count":1},{"name":"SSebo","email":"ssebo.zzz@gmail.com","login":"SSebo","count":1},{"name":"Suman Debnath","email":"56056673+debnsuma","login":"debnsuma","count":1},{"name":"Tao Qian","email":"taoxqian@gmail.com","login":"tao-qian","count":1},{"name":"Thanh Tran","email":"thanh.ptit.96@gmail.com","login":"thanhtcptit","count":1},{"name":"Tim Hopper","email":"tdhopper","login":"tdhopper","count":1},{"name":"Victor Skvortsov","email":"vds003@gmail.com","login":"r4victor","count":1},{"name":"ridhachahed","email":"31919686+ridhachahed","login":"ridhachahed","count":1},{"name":"rvaneijk","email":"rob@blaeu.com","login":"rvaneijk","count":1}],"past_year_total_commits":410,"past_year_total_committers":27,"past_year_total_bot_commits":0,"past_year_total_bot_committers":0,"past_year_mean_commits":15.185185185185185,"past_year_dds":0.19512195121951215,"last_synced_at":"2025-05-25T06:01:46.105Z","last_synced_commit":"c278745aff419ae6c1d6409ca4279aa57ea749e4","created_at":"2024-09-04T15:25:18.145Z","updated_at":"2025-05-25T06:01:46.143Z","commits_url":"https://commits.ecosyste.ms/api/v1/hosts/GitHub/repositories/rasbt%2FLLMs-from-scratch/commits","host":{"name":"GitHub","url":"https://github.com","kind":"github","last_synced_at":"2025-09-04T00:00:25.936Z","repositories_count":5480019,"commits_count":853389012,"contributors_count":31098138,"owners_count":906558,"icon_url":"https://github.com/github.png","host_url":"https://commits.ecosyste.ms/api/v1/hosts/GitHub","repositories_url":"https://commits.ecosyste.ms/api/v1/hosts/GitHub/repositories"}},"issues_stats":{"full_name":"rasbt/LLMs-from-scratch","html_url":"https://github.com/rasbt/LLMs-from-scratch","last_synced_at":"2025-09-04T14:35:18.756Z","status":null,"issues_count":165,"pull_requests_count":624,"avg_time_to_close_issue":134122.78048780488,"avg_time_to_close_pull_request":32300.294326241135,"issues_closed_count":123,"pull_requests_closed_count":564,"pull_request_authors_count":77,"issue_authors_count":82,"avg_comments_per_issue":1.503030303030303,"avg_comments_per_pull_request":1.1346153846153846,"merged_pull_requests_count":493,"bot_issues_count":0,"bot_pull_requests_count":0,"past_year_issues_count":90,"past_year_pull_requests_count":364,"past_year_avg_time_to_close_issue":204906.86440677967,"past_year_avg_time_to_close_pull_request":42565.2523659306,"past_year_issues_closed_count":59,"past_year_pull_requests_closed_count":317,"past_year_pull_request_authors_count":46,"past_year_issue_authors_count":53,"past_year_avg_comments_per_issue":1.1444444444444444,"past_year_avg_comments_per_pull_request":0.9807692307692307,"past_year_bot_issues_count":0,"past_year_bot_pull_requests_count":0,"past_year_merged_pull_requests_count":276,"created_at":"2024-09-04T15:25:24.659Z","updated_at":"2025-09-04T14:35:18.757Z","repository_url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/repositories/rasbt%2FLLMs-from-scratch","issues_url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/repositories/rasbt%2FLLMs-from-scratch/issues","issue_labels_count":{"bug":57,"question":28,"enhancement":3,"documentation":2,"update":1,"text typo":1},"pull_request_labels_count":{"bug":1,"question":1},"issue_author_associations_count":{"NONE":116,"CONTRIBUTOR":46,"OWNER":3},"pull_request_author_associations_count":{"OWNER":354,"CONTRIBUTOR":171,"NONE":99},"issue_authors":{"labdmitriy":31,"d-kleine":31,"PrinceSajjadHussain":5,"jingedawang":3,"casinca":3,"rasbt":3,"weezymatt":3,"xyang2013":3,"RahulYadav-tech-gif":3,"WilliamLee30":2,"qibin0506":2,"athul-22":2,"vico":2,"EricTay1997":2,"frankchieng":2,"Intelligence-Manifesto":2,"quanquanQQ":1,"Tsumugii24":1,"Linsen-gao-457":1,"vaifai":1,"listaction":1,"haiduo":1,"daddygongon":1,"younesselbrag":1,"navneethc":1,"rkinas":1,"axinging":1,"kevalshah90":1,"PSLHimaBindu":1,"chsharma27":1,"krikru":1,"AldawsariNLP":1,"gcapuzzi":1,"sirchristian":1,"taihaozesong":1,"montag":1,"DanielRojas20":1,"amani1874":1,"hanjr92":1,"KK666-AI":1,"b3ops":1,"mnuman":1,"zia-hasan":1,"lgmoneda":1,"Safarveisi":1,"TimRepke":1,"BuissonFlorent":1,"Gorock":1,"bpalmer7440":1,"cahya-wirawan":1,"charbull":1,"Akshat-Shu":1,"mikaylagawarecki":1,"Jessen-Li":1,"minaf1":1,"yuyi2439":1,"bjpcjp":1,"TITC":1,"xfpg21421":1,"npuichigo":1,"dengyunsheng250":1,"shivam-chandhok":1,"YinSonglin1997":1,"BaixiangZ":1,"ziqiyang107":1,"galopyz":1,"lmw4051":1,"Ameet1992":1,"verhas":1,"gustavomr":1,"dhruv20047228":1,"SeriousJ55":1,"ChenLi2049":1,"satyamedidi":1,"tt7533":1,"DesmondChoy":1,"InTheCloudDan":1,"Iosifts":1,"nithiyn":1,"itdxer":1,"Learn2Solve":1,"jameslholcombe":1},"pull_request_authors":{"rasbt":354,"d-kleine":83,"Intelligence-Manifesto":21,"casinca":11,"ziqiyang107":7,"TITC":7,"gsganden":6,"rayed-therap":6,"rayedbw":6,"weezymatt":5,"eltociear":5,"conglt-0917":4,"imkasen":4,"jinesh90":4,"henrythe9th":4,"jingedawang":3,"debnsuma":3,"helloboyn":2,"Hasan-75":2,"hammer":2,"taihaozesong":2,"xukai286":2,"tao-qian":2,"shimkoji":2,"rohanwinsor":2,"bkentropy":2,"rvaneijk":2,"shenxiangzhuang":2,"r4victor":2,"ngbrown":2,"tdhopper":2,"lioda":2,"BartoszBLL":2,"gustavomr":2,"Shuyib":2,"BioGeek":2,"ductringuyen":2,"Linsen-gao-457":2,"ridhachahed":2,"joel-foo":2,"matthewfeickert":2,"wexhi":2,"austinmw":2,"NPrashanthReddy":2,"Mike-7777777":2,"mix16atpitt":2,"krouser":2,"QuantumBear":2,"JasonnnW3000":1,"EricThomson":1,"GiosueSglavo96":1,"Shashank204002":1,"ayan-chattaraj":1,"martinzwm":1,"speed1313":1,"TianYubo":1,"jjddbouhl":1,"pitmonticone":1,"MalikZeeshan1122":1,"anupsharma555":1,"xiaotian0328":1,"ilya-pi":1,"SSebo":1,"kuutsav":1,"kowy-liu":1,"PratyushSubhadarshi":1,"jameslholcombe":1,"jestinepaul":1,"netcan":1,"DrCesar":1,"AakashKumarNain":1,"PrinceSajjadHussain":1,"xinfeng-yes":1,"Shamik-07":1,"superkostya":1,"thanhtcptit":1,"ehberg":1},"host":{"name":"GitHub","url":"https://github.com","kind":"github","last_synced_at":"2025-09-04T00:00:25.939Z","repositories_count":10081478,"issues_count":31331220,"pull_requests_count":96240505,"authors_count":10693617,"icon_url":"https://github.com/github.png","host_url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub","repositories_url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/repositories","owners_url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/owners","authors_url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/authors"},"past_year_issue_labels_count":{"bug":36,"question":22,"documentation":2,"enhancement":2,"update":1,"text typo":1},"past_year_pull_request_labels_count":{},"past_year_issue_author_associations_count":{"NONE":55,"CONTRIBUTOR":33,"OWNER":2},"past_year_pull_request_author_associations_count":{"OWNER":221,"CONTRIBUTOR":75,"NONE":68},"past_year_issue_authors":{"d-kleine":23,"PrinceSajjadHussain":5,"xyang2013":3,"casinca":3,"weezymatt":3,"RahulYadav-tech-gif":3,"EricTay1997":2,"WilliamLee30":2,"rasbt":2,"Safarveisi":1,"rkinas":1,"quanquanQQ":1,"PSLHimaBindu":1,"nithiyn":1,"navneethc":1,"mnuman":1,"mikaylagawarecki":1,"SeriousJ55":1,"shivam-chandhok":1,"sirchristian":1,"tt7533":1,"vaifai":1,"verhas":1,"xfpg21421":1,"YinSonglin1997":1,"yuyi2439":1,"zia-hasan":1,"ziqiyang107":1,"Akshat-Shu":1,"AldawsariNLP":1,"amani1874":1,"BaixiangZ":1,"bpalmer7440":1,"BuissonFlorent":1,"cahya-wirawan":1,"charbull":1,"chsharma27":1,"daddygongon":1,"DanielRojas20":1,"dengyunsheng250":1,"dhruv20047228":1,"galopyz":1,"Gorock":1,"gustavomr":1,"haiduo":1,"Iosifts":1,"itdxer":1,"Jessen-Li":1,"jingedawang":1,"KK666-AI":1,"lgmoneda":1,"Linsen-gao-457":1,"lmw4051":1},"past_year_pull_request_authors":{"rasbt":221,"d-kleine":38,"casinca":11,"ziqiyang107":7,"gsganden":6,"weezymatt":5,"jinesh90":4,"conglt-0917":4,"imkasen":4,"henrythe9th":4,"austinmw":2,"gustavomr":2,"xukai286":2,"Hasan-75":2,"matthewfeickert":2,"r4victor":2,"helloboyn":2,"ridhachahed":2,"Linsen-gao-457":2,"wexhi":2,"ngbrown":2,"QuantumBear":2,"BartoszBLL":2,"lioda":2,"tdhopper":2,"NPrashanthReddy":2,"bkentropy":2,"krouser":2,"mix16atpitt":2,"Mike-7777777":2,"rohanwinsor":2,"tao-qian":2,"shimkoji":2,"rvaneijk":2,"TianYubo":1,"jingedawang":1,"JasonnnW3000":1,"jestinepaul":1,"anupsharma555":1,"martinzwm":1,"Shamik-07":1,"xinfeng-yes":1,"PratyushSubhadarshi":1,"PrinceSajjadHussain":1,"kowy-liu":1,"GiosueSglavo96":1},"maintainers":[{"login":"rasbt","count":357,"url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/authors/rasbt"}],"active_maintainers":[{"login":"rasbt","count":223,"url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/authors/rasbt"}]},"events":null,"keywords":["ai","artificial-intelligence","chatgpt","deep-learning","from-scratch","gpt","language-model","large-language-models","llm","machine-learning","python","pytorch","transformer"],"dependencies":[],"score":14.870622267906368,"created_at":"2025-09-04T15:50:15.944Z","updated_at":"2025-10-07T08:05:23.235Z","avatar_url":"https://github.com/rasbt.png","language":"Jupyter Notebook","category":null,"sub_category":null,"monthly_downloads":0,"funding_links":[],"readme_doi_urls":[],"works":{},"citation_counts":{},"total_citations":0,"keywords_from_contributors":["data-mining","jax"],"project_url":"https://science.ecosyste.ms/api/v1/projects/5458","html_url":"https://science.ecosyste.ms/projects/5458","bibtex_url":"https://science.ecosyste.ms/projects/5458/export.bibtex","apalike_url":"https://science.ecosyste.ms/projects/5458/export.apalike"}