{"id":54668,"name":"dolma","description":"Data and tools for generating and inspecting OLMo pre-training data. ","url":"https://github.com/allenai/dolma","last_synced_at":"2025-09-05T13:34:43.691Z","repository":{"id":177024402,"uuid":"656376920","full_name":"allenai/dolma","owner":"allenai","description":"Data and tools for generating and inspecting OLMo pre-training data. ","archived":false,"fork":false,"pushed_at":"2025-08-14T21:04:38.000Z","size":65827,"stargazers_count":1293,"open_issues_count":24,"forks_count":147,"subscribers_count":24,"default_branch":"main","last_synced_at":"2025-08-14T23:11:09.739Z","etag":null,"topics":["data-processing","large-language-models","llm","machile-learning","nlp"],"latest_commit_sha":null,"homepage":"https://allenai.github.io/dolma/","language":"Python","has_issues":true,"has_wiki":null,"has_pages":null,"mirror_url":null,"source_name":null,"license":"apache-2.0","status":null,"scm":"git","pull_requests_enabled":true,"icon_url":"https://github.com/allenai.png","metadata":{"files":{"readme":"README.md","changelog":null,"contributing":null,"funding":null,"license":"LICENSE","code_of_conduct":null,"threat_model":null,"audit":null,"citation":"CITATION.cff","codeowners":null,"security":null,"support":null,"governance":null,"roadmap":null,"authors":null,"dei":null,"publiccode":null,"codemeta":null,"zenodo":null}},"created_at":"2023-06-20T20:37:39.000Z","updated_at":"2025-08-14T10:28:21.000Z","dependencies_parsed_at":"2024-02-06T02:25:09.492Z","dependency_job_id":"58c6becd-ceb3-4836-89a2-809ae8373107","html_url":"https://github.com/allenai/dolma","commit_stats":{"total_commits":283,"total_committers":22,"mean_commits":"12.863636363636363","dds":0.6890459363957597,"last_synced_commit":"4cf2d177add315de8e5f90bc6df861ed0c820eb4"},"previous_names":["allenai/dolma"],"tags_count":41,"template":false,"template_full_name":null,"purl":"pkg:github/allenai/dolma","repository_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma","tags_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags","releases_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/releases","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/manifests","owner_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners/allenai","download_url":"https://codeload.github.com/allenai/dolma/tar.gz/refs/heads/main","sbom_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/sbom","scorecard":null,"host":{"name":"GitHub","url":"https://github.com","kind":"github","repositories_count":273766015,"owners_count":25164254,"icon_url":"https://github.com/github.png","version":null,"created_at":"2022-05-30T11:31:42.601Z","updated_at":"2022-07-04T15:15:14.044Z","status":"online","status_checked_at":"2025-09-05T02:00:09.113Z","response_time":402,"last_error":null,"robots_txt_status":"success","robots_txt_updated_at":"2025-07-24T06:49:26.215Z","robots_txt_url":"https://github.com/robots.txt","online":true,"can_crawl_api":true,"host_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub","repositories_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories","repository_names_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repository_names","owners_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners"}},"owner":{"login":"allenai","name":"AI2","uuid":"5667695","kind":"organization","description":"","email":"ai2-info@allenai.org","website":"http://www.allenai.org","location":"Seattle, WA","twitter":null,"company":null,"icon_url":"https://avatars.githubusercontent.com/u/5667695?v=4","repositories_count":454,"last_synced_at":"2024-04-14T22:06:46.803Z","metadata":{"has_sponsors_listing":false},"html_url":"https://github.com/allenai","funding_links":[],"total_stars":58847,"followers":1621,"following":0,"created_at":"2022-11-06T17:18:34.185Z","updated_at":"2024-04-14T22:08:05.570Z","owner_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners/allenai","repositories_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners/allenai/repositories"},"packages":[{"id":11709419,"name":"github.com/allenai/dolma","ecosystem":"go","description":null,"homepage":null,"licenses":"apache-2.0","normalized_licenses":["Apache-2.0"],"repository_url":"https://github.com/allenai/dolma","keywords_array":[],"namespace":null,"versions_count":38,"first_release_published_at":"2023-07-10T01:20:06.000Z","latest_release_published_at":"2025-06-25T18:52:53.000Z","latest_release_number":"v1.2.1","last_synced_at":"2025-08-14T23:19:14.125Z","created_at":"2025-05-30T10:33:15.470Z","updated_at":"2025-08-15T03:51:11.049Z","registry_url":"https://pkg.go.dev/github.com/allenai/dolma","install_command":"go get github.com/allenai/dolma","documentation_url":"https://pkg.go.dev/github.com/allenai/dolma#section-documentation","metadata":{},"repo_metadata":{"id":177024402,"uuid":"656376920","full_name":"allenai/dolma","owner":"allenai","description":"Data and tools for generating and inspecting OLMo pre-training data. ","archived":false,"fork":false,"pushed_at":"2025-08-14T21:04:38.000Z","size":65827,"stargazers_count":1293,"open_issues_count":24,"forks_count":147,"subscribers_count":24,"default_branch":"main","last_synced_at":"2025-08-14T23:11:09.739Z","etag":null,"topics":["data-processing","large-language-models","llm","machile-learning","nlp"],"latest_commit_sha":null,"homepage":"https://allenai.github.io/dolma/","language":"Python","has_issues":true,"has_wiki":null,"has_pages":null,"mirror_url":null,"source_name":null,"license":"apache-2.0","status":null,"scm":"git","pull_requests_enabled":true,"icon_url":"https://github.com/allenai.png","metadata":{"files":{"readme":"README.md","changelog":null,"contributing":null,"funding":null,"license":"LICENSE","code_of_conduct":null,"threat_model":null,"audit":null,"citation":"CITATION.cff","codeowners":null,"security":null,"support":null,"governance":null,"roadmap":null,"authors":null,"dei":null,"publiccode":null,"codemeta":null,"zenodo":null}},"created_at":"2023-06-20T20:37:39.000Z","updated_at":"2025-08-14T10:28:21.000Z","dependencies_parsed_at":"2024-02-06T02:25:09.492Z","dependency_job_id":"58c6becd-ceb3-4836-89a2-809ae8373107","html_url":"https://github.com/allenai/dolma","commit_stats":{"total_commits":283,"total_committers":22,"mean_commits":"12.863636363636363","dds":0.6890459363957597,"last_synced_commit":"4cf2d177add315de8e5f90bc6df861ed0c820eb4"},"previous_names":["allenai/dolma"],"tags_count":41,"template":false,"template_full_name":null,"purl":"pkg:github/allenai/dolma","repository_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma","tags_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags","releases_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/releases","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/manifests","owner_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners/allenai","download_url":"https://codeload.github.com/allenai/dolma/tar.gz/refs/heads/main","sbom_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/sbom","scorecard":null,"host":{"name":"GitHub","url":"https://github.com","kind":"github","repositories_count":270519905,"owners_count":24599253,"icon_url":"https://github.com/github.png","version":null,"created_at":"2022-05-30T11:31:42.601Z","updated_at":"2022-07-04T15:15:14.044Z","status":"online","status_checked_at":"2025-08-15T02:00:12.559Z","response_time":110,"last_error":null,"robots_txt_status":"success","robots_txt_updated_at":"2025-07-24T06:49:26.215Z","robots_txt_url":"https://github.com/robots.txt","online":true,"can_crawl_api":true,"host_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub","repositories_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories","repository_names_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repository_names","owners_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners"},"owner_record":{"login":"allenai","name":"AI2","uuid":"5667695","kind":"organization","description":"","email":"ai2-info@allenai.org","website":"http://www.allenai.org","location":"Seattle, WA","twitter":null,"company":null,"icon_url":"https://avatars.githubusercontent.com/u/5667695?v=4","repositories_count":454,"last_synced_at":"2024-04-14T22:06:46.803Z","metadata":{"has_sponsors_listing":false},"html_url":"https://github.com/allenai","funding_links":[],"total_stars":58847,"followers":1621,"following":0,"created_at":"2022-11-06T17:18:34.185Z","updated_at":"2024-04-14T22:08:05.570Z","owner_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners/allenai","repositories_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners/allenai/repositories"},"tags":[{"name":"v1.2.1","sha":"fd22a34972a36bf1a60d2f161533d55b2be4c047","kind":"commit","published_at":"2025-06-25T18:52:53.000Z","download_url":"https://codeload.github.com/allenai/dolma/tar.gz/v1.2.1","html_url":"https://github.com/allenai/dolma/releases/tag/v1.2.1","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/allenai/dolma@v1.2.1","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.2.1","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.2.1/manifests"},{"name":"v1.2.0","sha":"f66cd3ffa397a56c616a63bcfc1ec06a17908d5f","kind":"commit","published_at":"2025-06-03T01:06:25.000Z","download_url":"https://codeload.github.com/allenai/dolma/tar.gz/v1.2.0","html_url":"https://github.com/allenai/dolma/releases/tag/v1.2.0","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/allenai/dolma@v1.2.0","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.2.0","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.2.0/manifests"},{"name":"v1.2.0-dev8","sha":"eb65611fcd35644157c44481f0be2cc15c501be3","kind":"commit","published_at":"2025-04-04T17:00:18.000Z","download_url":"https://codeload.github.com/allenai/dolma/tar.gz/v1.2.0-dev8","html_url":"https://github.com/allenai/dolma/releases/tag/v1.2.0-dev8","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/allenai/dolma@v1.2.0-dev8","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.2.0-dev8","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.2.0-dev8/manifests"},{"name":"1.2.0.dev7","sha":"e9527ebf241b6576e56a4a92826bd898a5f48350","kind":"commit","published_at":"2025-03-05T18:11:21.000Z","download_url":"https://codeload.github.com/allenai/dolma/tar.gz/1.2.0.dev7","html_url":"https://github.com/allenai/dolma/releases/tag/1.2.0.dev7","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/allenai/dolma@1.2.0.dev7","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/1.2.0.dev7","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/1.2.0.dev7/manifests"},{"name":"v1.1.2","sha":"3916871f53bee9244abcc964c717a631846e9174","kind":"commit","published_at":"2025-02-20T00:40:24.000Z","download_url":"https://codeload.github.com/allenai/dolma/tar.gz/v1.1.2","html_url":"https://github.com/allenai/dolma/releases/tag/v1.1.2","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/allenai/dolma@v1.1.2","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.1.2","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.1.2/manifests"},{"name":"v1.1.1.post3","sha":"17242c32b1fb117e430c7325e64ad250115b37ce","kind":"commit","published_at":"2025-02-14T00:57:24.000Z","download_url":"https://codeload.github.com/allenai/dolma/tar.gz/v1.1.1.post3","html_url":"https://github.com/allenai/dolma/releases/tag/v1.1.1.post3","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/allenai/dolma@v1.1.1.post3","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.1.1.post3","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.1.1.post3/manifests"},{"name":"v1.2.0-dev6","sha":"81711b885ae9e26ead2061b8d45770eb36a644b3","kind":"commit","published_at":"2025-02-13T23:15:05.000Z","download_url":"https://codeload.github.com/allenai/dolma/tar.gz/v1.2.0-dev6","html_url":"https://github.com/allenai/dolma/releases/tag/v1.2.0-dev6","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/allenai/dolma@v1.2.0-dev6","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.2.0-dev6","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.2.0-dev6/manifests"},{"name":"v1.2.0-dev5","sha":"8d50f74f8b8168724a4f955aa009e25d655d49c7","kind":"commit","published_at":"2025-02-13T21:45:27.000Z","download_url":"https://codeload.github.com/allenai/dolma/tar.gz/v1.2.0-dev5","html_url":"https://github.com/allenai/dolma/releases/tag/v1.2.0-dev5","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/allenai/dolma@v1.2.0-dev5","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.2.0-dev5","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.2.0-dev5/manifests"},{"name":"v1.2.0-dev4","sha":"6eaf41e4eb4fd7f07395278ddd2ee04523f5756e","kind":"commit","published_at":"2025-02-13T21:20:08.000Z","download_url":"https://codeload.github.com/allenai/dolma/tar.gz/v1.2.0-dev4","html_url":"https://github.com/allenai/dolma/releases/tag/v1.2.0-dev4","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/allenai/dolma@v1.2.0-dev4","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.2.0-dev4","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.2.0-dev4/manifests"},{"name":"v1.2.0-dev3","sha":"eef699858883202d5cf10eb711386c9aa98a8eda","kind":"commit","published_at":"2025-02-13T21:01:05.000Z","download_url":"https://codeload.github.com/allenai/dolma/tar.gz/v1.2.0-dev3","html_url":"https://github.com/allenai/dolma/releases/tag/v1.2.0-dev3","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/allenai/dolma@v1.2.0-dev3","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.2.0-dev3","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.2.0-dev3/manifests"},{"name":"v1.2.0-dev2","sha":"2659e3d71b1561902026e8739bb99407e303492b","kind":"commit","published_at":"2025-02-13T20:27:57.000Z","download_url":"https://codeload.github.com/allenai/dolma/tar.gz/v1.2.0-dev2","html_url":"https://github.com/allenai/dolma/releases/tag/v1.2.0-dev2","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/allenai/dolma@v1.2.0-dev2","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.2.0-dev2","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.2.0-dev2/manifests"},{"name":"v1.1.1","sha":"704e8b0757fa7e08b6cff2dc62dd58c99bc39f67","kind":"commit","published_at":"2025-02-13T20:21:28.000Z","download_url":"https://codeload.github.com/allenai/dolma/tar.gz/v1.1.1","html_url":"https://github.com/allenai/dolma/releases/tag/v1.1.1","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/allenai/dolma@v1.1.1","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.1.1","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.1.1/manifests"},{"name":"v1.2.0-dev1","sha":"a2bd2eea7ff0ce1400f610c68747f0ca5cd81c95","kind":"commit","published_at":"2025-02-13T19:51:51.000Z","download_url":"https://codeload.github.com/allenai/dolma/tar.gz/v1.2.0-dev1","html_url":"https://github.com/allenai/dolma/releases/tag/v1.2.0-dev1","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/allenai/dolma@v1.2.0-dev1","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.2.0-dev1","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.2.0-dev1/manifests"},{"name":"v1.2.0-dev0","sha":"cdaf1a65ffbe3a8b7bb21f45234c1d4c9fa501cf","kind":"commit","published_at":"2025-02-13T19:27:45.000Z","download_url":"https://codeload.github.com/allenai/dolma/tar.gz/v1.2.0-dev0","html_url":"https://github.com/allenai/dolma/releases/tag/v1.2.0-dev0","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/allenai/dolma@v1.2.0-dev0","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.2.0-dev0","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.2.0-dev0/manifests"},{"name":"v1.1.0","sha":"a8242205733d6df988b2fa04a96ac0779f277972","kind":"commit","published_at":"2024-12-02T16:45:49.000Z","download_url":"https://codeload.github.com/allenai/dolma/tar.gz/v1.1.0","html_url":"https://github.com/allenai/dolma/releases/tag/v1.1.0","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/allenai/dolma@v1.1.0","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.1.0","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.1.0/manifests"},{"name":"v1.0.14.post1","sha":"c029e94445290d79ae4ee293e5bf5645b5cacfa9","kind":"commit","published_at":"2024-09-24T23:53:00.000Z","download_url":"https://codeload.github.com/allenai/dolma/tar.gz/v1.0.14.post1","html_url":"https://github.com/allenai/dolma/releases/tag/v1.0.14.post1","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/allenai/dolma@v1.0.14.post1","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.0.14.post1","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.0.14.post1/manifests"},{"name":"v1.0.14","sha":"06d521d11a2a39d49cec467eba4e407f0d21a731","kind":"commit","published_at":"2024-09-24T20:08:31.000Z","download_url":"https://codeload.github.com/allenai/dolma/tar.gz/v1.0.14","html_url":"https://github.com/allenai/dolma/releases/tag/v1.0.14","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/allenai/dolma@v1.0.14","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.0.14","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.0.14/manifests"},{"name":"v1.0.13","sha":"8a3c05818009927c7ed644b60394278e8cb3c02e","kind":"commit","published_at":"2024-09-20T20:53:49.000Z","download_url":"https://codeload.github.com/allenai/dolma/tar.gz/v1.0.13","html_url":"https://github.com/allenai/dolma/releases/tag/v1.0.13","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/allenai/dolma@v1.0.13","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.0.13","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.0.13/manifests"},{"name":"v1.0.12","sha":"2a4ef7053a01ff5f08a170e14f88a9211954b1f1","kind":"commit","published_at":"2024-08-28T22:41:30.000Z","download_url":"https://codeload.github.com/allenai/dolma/tar.gz/v1.0.12","html_url":"https://github.com/allenai/dolma/releases/tag/v1.0.12","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/allenai/dolma@v1.0.12","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.0.12","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.0.12/manifests"},{"name":"v1.0.11","sha":"16452bbb66a33aa9e988eec13b143fd96531251a","kind":"commit","published_at":"2024-08-22T01:05:53.000Z","download_url":"https://codeload.github.com/allenai/dolma/tar.gz/v1.0.11","html_url":"https://github.com/allenai/dolma/releases/tag/v1.0.11","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/allenai/dolma@v1.0.11","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.0.11","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.0.11/manifests"},{"name":"v1.0.10","sha":"f365470031b615097e9c8f9ccb167dc35714f1fa","kind":"commit","published_at":"2024-08-17T21:24:29.000Z","download_url":"https://codeload.github.com/allenai/dolma/tar.gz/v1.0.10","html_url":"https://github.com/allenai/dolma/releases/tag/v1.0.10","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/allenai/dolma@v1.0.10","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.0.10","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.0.10/manifests"},{"name":"v1.0.9","sha":"c4fa395c8fc7782c9d112b66f6e1c46e0b945a5a","kind":"commit","published_at":"2024-08-11T01:17:55.000Z","download_url":"https://codeload.github.com/allenai/dolma/tar.gz/v1.0.9","html_url":"https://github.com/allenai/dolma/releases/tag/v1.0.9","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/allenai/dolma@v1.0.9","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.0.9","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.0.9/manifests"},{"name":"v1.0.8","sha":"4322ad0db0a1938a0f30ea43ac0bebe04289410e","kind":"commit","published_at":"2024-08-06T23:01:38.000Z","download_url":"https://codeload.github.com/allenai/dolma/tar.gz/v1.0.8","html_url":"https://github.com/allenai/dolma/releases/tag/v1.0.8","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/allenai/dolma@v1.0.8","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.0.8","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.0.8/manifests"},{"name":"v1.0.7","sha":"abb67f749d1b83b763d69267d66b590d352a0214","kind":"commit","published_at":"2024-08-06T19:52:35.000Z","download_url":"https://codeload.github.com/allenai/dolma/tar.gz/v1.0.7","html_url":"https://github.com/allenai/dolma/releases/tag/v1.0.7","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/allenai/dolma@v1.0.7","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.0.7","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.0.7/manifests"},{"name":"v1.0.6","sha":"a72c76b26b92e22eeab10905f76c739c73bf4535","kind":"commit","published_at":"2024-08-01T16:47:06.000Z","download_url":"https://codeload.github.com/allenai/dolma/tar.gz/v1.0.6","html_url":"https://github.com/allenai/dolma/releases/tag/v1.0.6","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/allenai/dolma@v1.0.6","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.0.6","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.0.6/manifests"},{"name":"v1.0.5","sha":"a01a2229ea0626dfda243e1cc2e82afe53071a0a","kind":"commit","published_at":"2024-07-26T20:07:12.000Z","download_url":"https://codeload.github.com/allenai/dolma/tar.gz/v1.0.5","html_url":"https://github.com/allenai/dolma/releases/tag/v1.0.5","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/allenai/dolma@v1.0.5","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.0.5","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.0.5/manifests"},{"name":"v1.0.4","sha":"5868453e7cda753af4bf66058c5518c017df8729","kind":"commit","published_at":"2024-07-24T19:01:56.000Z","download_url":"https://codeload.github.com/allenai/dolma/tar.gz/v1.0.4","html_url":"https://github.com/allenai/dolma/releases/tag/v1.0.4","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/allenai/dolma@v1.0.4","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.0.4","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.0.4/manifests"},{"name":"v1.0.3","sha":"6673ad32f561c59a2c412f806385c3d7cc3681f3","kind":"commit","published_at":"2024-04-10T20:41:16.000Z","download_url":"https://codeload.github.com/allenai/dolma/tar.gz/v1.0.3","html_url":"https://github.com/allenai/dolma/releases/tag/v1.0.3","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/allenai/dolma@v1.0.3","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.0.3","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.0.3/manifests"},{"name":"v1.0.2","sha":"4e1d17f091668abbc4748ef2ba2fd721d7e6144d","kind":"commit","published_at":"2024-03-21T16:44:51.000Z","download_url":"https://codeload.github.com/allenai/dolma/tar.gz/v1.0.2","html_url":"https://github.com/allenai/dolma/releases/tag/v1.0.2","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/allenai/dolma@v1.0.2","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.0.2","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.0.2/manifests"},{"name":"v1.0.1","sha":"f6970d51ed14979a70bab7e3f5317d91c71e3eeb","kind":"commit","published_at":"2024-02-07T18:02:48.000Z","download_url":"https://codeload.github.com/allenai/dolma/tar.gz/v1.0.1","html_url":"https://github.com/allenai/dolma/releases/tag/v1.0.1","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/allenai/dolma@v1.0.1","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.0.1","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.0.1/manifests"},{"name":"v1.0.0","sha":"a74b78ac531e06adb61bf70986c8d2a3ef38e9d7","kind":"commit","published_at":"2024-02-01T08:23:18.000Z","download_url":"https://codeload.github.com/allenai/dolma/tar.gz/v1.0.0","html_url":"https://github.com/allenai/dolma/releases/tag/v1.0.0","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/allenai/dolma@v1.0.0","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.0.0","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.0.0/manifests"},{"name":"v0.9.4","sha":"a44489f056188e9598f14a78b0e4bb6c85779bec","kind":"commit","published_at":"2024-01-21T02:02:11.000Z","download_url":"https://codeload.github.com/allenai/dolma/tar.gz/v0.9.4","html_url":"https://github.com/allenai/dolma/releases/tag/v0.9.4","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/allenai/dolma@v0.9.4","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v0.9.4","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v0.9.4/manifests"},{"name":"v0.9.2","sha":"ede739f367827101df2d150f68e897987bd3100e","kind":"commit","published_at":"2024-01-15T06:34:15.000Z","download_url":"https://codeload.github.com/allenai/dolma/tar.gz/v0.9.2","html_url":"https://github.com/allenai/dolma/releases/tag/v0.9.2","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/allenai/dolma@v0.9.2","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v0.9.2","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v0.9.2/manifests"},{"name":"v0.9.1","sha":"2ee1ae27f32c09531699301ef8271a6cb45da2da","kind":"commit","published_at":"2023-10-26T04:55:15.000Z","download_url":"https://codeload.github.com/allenai/dolma/tar.gz/v0.9.1","html_url":"https://github.com/allenai/dolma/releases/tag/v0.9.1","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/allenai/dolma@v0.9.1","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v0.9.1","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v0.9.1/manifests"},{"name":"v0.9.0","sha":"1728f4f5267360fa54662b8e01fc0efa6414e498","kind":"commit","published_at":"2023-10-15T19:25:51.000Z","download_url":"https://codeload.github.com/allenai/dolma/tar.gz/v0.9.0","html_url":"https://github.com/allenai/dolma/releases/tag/v0.9.0","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/allenai/dolma@v0.9.0","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v0.9.0","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v0.9.0/manifests"},{"name":"v0.8.0","sha":"705d358cc5d2467c8ae0a703d3d27aded99d9c8f","kind":"commit","published_at":"2023-08-18T13:26:50.000Z","download_url":"https://codeload.github.com/allenai/dolma/tar.gz/v0.8.0","html_url":"https://github.com/allenai/dolma/releases/tag/v0.8.0","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/allenai/dolma@v0.8.0","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v0.8.0","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v0.8.0/manifests"},{"name":"v0.7.0","sha":"a37e7c6b1c883aea84bd30e78dc6589859c881f5","kind":"commit","published_at":"2023-07-21T14:48:24.000Z","download_url":"https://codeload.github.com/allenai/dolma/tar.gz/v0.7.0","html_url":"https://github.com/allenai/dolma/releases/tag/v0.7.0","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/allenai/dolma@v0.7.0","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v0.7.0","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v0.7.0/manifests"},{"name":"v0.6.5","sha":"10c296461306efa23b1ec74a2d75e2908195e185","kind":"commit","published_at":"2023-07-18T03:40:22.000Z","download_url":"https://codeload.github.com/allenai/dolma/tar.gz/v0.6.5","html_url":"https://github.com/allenai/dolma/releases/tag/v0.6.5","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/allenai/dolma@v0.6.5","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v0.6.5","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v0.6.5/manifests"},{"name":"v0.6.4","sha":"9a04d9dbbdbb2066997e8d7394ba33f477917a10","kind":"commit","published_at":"2023-07-16T00:57:51.000Z","download_url":"https://codeload.github.com/allenai/dolma/tar.gz/v0.6.4","html_url":"https://github.com/allenai/dolma/releases/tag/v0.6.4","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/allenai/dolma@v0.6.4","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v0.6.4","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v0.6.4/manifests"},{"name":"v0.6.3","sha":"422800251c7a3ff1ca6201aab77b06ef2a746574","kind":"commit","published_at":"2023-07-11T00:01:11.000Z","download_url":"https://codeload.github.com/allenai/dolma/tar.gz/v0.6.3","html_url":"https://github.com/allenai/dolma/releases/tag/v0.6.3","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/allenai/dolma@v0.6.3","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v0.6.3","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v0.6.3/manifests"},{"name":"v0.6.2","sha":"eb572198865204924bd6c2ae185a3581a03a1474","kind":"commit","published_at":"2023-07-10T01:20:06.000Z","download_url":"https://codeload.github.com/allenai/dolma/tar.gz/v0.6.2","html_url":"https://github.com/allenai/dolma/releases/tag/v0.6.2","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/allenai/dolma@v0.6.2","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v0.6.2","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v0.6.2/manifests"}]},"repo_metadata_updated_at":"2025-08-15T03:51:11.049Z","dependent_packages_count":0,"downloads":null,"downloads_period":null,"dependent_repos_count":0,"rankings":{"downloads":null,"dependent_repos_count":5.784814001734242,"dependent_packages_count":5.420815499828766,"stargazers_count":null,"forks_count":null,"docker_downloads_count":null,"average":5.602814750781504},"purl":"pkg:golang/github.com/allenai/dolma","advisories":[],"docker_usage_url":"https://docker.ecosyste.ms/usage/go/github.com/allenai/dolma","docker_dependents_count":null,"docker_downloads_count":null,"usage_url":"https://repos.ecosyste.ms/usage/go/github.com/allenai/dolma","dependent_repositories_url":"https://repos.ecosyste.ms/api/v1/usage/go/github.com/allenai/dolma/dependencies","status":null,"funding_links":[],"critical":null,"issue_metadata":{"last_synced_at":"2025-08-01T23:19:12.133Z","issues_count":114,"pull_requests_count":189,"avg_time_to_close_issue":9619177.35,"avg_time_to_close_pull_request":822295.1724137932,"issues_closed_count":100,"pull_requests_closed_count":174,"pull_request_authors_count":30,"issue_authors_count":46,"avg_comments_per_issue":1.8245614035087718,"avg_comments_per_pull_request":0.3915343915343915,"merged_pull_requests_count":158,"bot_issues_count":0,"bot_pull_requests_count":12,"past_year_issues_count":20,"past_year_pull_requests_count":49,"past_year_avg_time_to_close_issue":7721022.125,"past_year_avg_time_to_close_pull_request":1067314.6666666667,"past_year_issues_closed_count":16,"past_year_pull_requests_closed_count":39,"past_year_pull_request_authors_count":14,"past_year_issue_authors_count":17,"past_year_avg_comments_per_issue":1.75,"past_year_avg_comments_per_pull_request":0.16326530612244897,"past_year_bot_issues_count":0,"past_year_bot_pull_requests_count":3,"past_year_merged_pull_requests_count":36,"issues_url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/issues","maintainers":[{"login":"soldni","count":90,"url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/authors/soldni"},{"login":"kyleclo","count":6,"url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/authors/kyleclo"},{"login":"rodneykinney","count":3,"url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/authors/rodneykinney"},{"login":"aman-17","count":1,"url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/authors/aman-17"},{"login":"dirkgr","count":1,"url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/authors/dirkgr"},{"login":"epwalsh","count":1,"url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/authors/epwalsh"}],"active_maintainers":[{"login":"soldni","count":17,"url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/authors/soldni"},{"login":"aman-17","count":1,"url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/authors/aman-17"},{"login":"epwalsh","count":1,"url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/authors/epwalsh"},{"login":"kyleclo","count":1,"url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/authors/kyleclo"}]},"versions_url":"https://packages.ecosyste.ms/api/v1/registries/proxy.golang.org/packages/github.com%2Fallenai%2Fdolma/versions","version_numbers_url":"https://packages.ecosyste.ms/api/v1/registries/proxy.golang.org/packages/github.com%2Fallenai%2Fdolma/version_numbers","dependent_packages_url":"https://packages.ecosyste.ms/api/v1/registries/proxy.golang.org/packages/github.com%2Fallenai%2Fdolma/dependent_packages","related_packages_url":"https://packages.ecosyste.ms/api/v1/registries/proxy.golang.org/packages/github.com%2Fallenai%2Fdolma/related_packages","maintainers":[],"registry":{"name":"proxy.golang.org","url":"https://proxy.golang.org","ecosystem":"go","default":true,"packages_count":1952121,"maintainers_count":0,"namespaces_count":741275,"keywords_count":109185,"github":"golang","metadata":{"funded_packages_count":49011},"icon_url":"https://github.com/golang.png","created_at":"2022-04-04T15:19:22.939Z","updated_at":"2025-09-05T05:14:06.439Z","packages_url":"https://packages.ecosyste.ms/api/v1/registries/proxy.golang.org/packages","maintainers_url":"https://packages.ecosyste.ms/api/v1/registries/proxy.golang.org/maintainers","namespaces_url":"https://packages.ecosyste.ms/api/v1/registries/proxy.golang.org/namespaces"}},{"id":7908501,"name":"dolma","ecosystem":"pypi","description":"Toolkit for pre-processing LLM training data.","homepage":"https://github.com/allenai/dolma","licenses":"Apache-2.0","normalized_licenses":["Apache-2.0"],"repository_url":"https://github.com/allenai/dolma","keywords_array":[],"namespace":null,"versions_count":41,"first_release_published_at":"2023-07-09T03:51:38.000Z","latest_release_published_at":"2025-07-07T16:02:52.000Z","latest_release_number":"1.2.1","last_synced_at":"2025-08-14T23:19:13.974Z","created_at":"2023-07-09T04:21:16.356Z","updated_at":"2025-08-15T03:51:11.627Z","registry_url":"https://pypi.org/project/dolma/","install_command":"pip install dolma --index-url https://pypi.org/simple","documentation_url":"https://dolma.readthedocs.io/","metadata":{"funding":null,"documentation":null,"classifiers":["Development Status :: 5 - Production/Stable","Intended Audience :: Science/Research","License :: OSI Approved :: Apache Software License","Programming Language :: Python :: Implementation :: CPython","Programming Language :: Rust","Topic :: Scientific/Engineering :: Artificial Intelligence","Topic :: Text Processing","Typing :: Typed"],"normalized_name":"dolma"},"repo_metadata":{"id":177024402,"uuid":"656376920","full_name":"allenai/dolma","owner":"allenai","description":"Data and tools for generating and inspecting OLMo pre-training data. ","archived":false,"fork":false,"pushed_at":"2025-08-14T21:04:38.000Z","size":65827,"stargazers_count":1293,"open_issues_count":24,"forks_count":147,"subscribers_count":24,"default_branch":"main","last_synced_at":"2025-08-14T23:11:09.739Z","etag":null,"topics":["data-processing","large-language-models","llm","machile-learning","nlp"],"latest_commit_sha":null,"homepage":"https://allenai.github.io/dolma/","language":"Python","has_issues":true,"has_wiki":null,"has_pages":null,"mirror_url":null,"source_name":null,"license":"apache-2.0","status":null,"scm":"git","pull_requests_enabled":true,"icon_url":"https://github.com/allenai.png","metadata":{"files":{"readme":"README.md","changelog":null,"contributing":null,"funding":null,"license":"LICENSE","code_of_conduct":null,"threat_model":null,"audit":null,"citation":"CITATION.cff","codeowners":null,"security":null,"support":null,"governance":null,"roadmap":null,"authors":null,"dei":null,"publiccode":null,"codemeta":null,"zenodo":null}},"created_at":"2023-06-20T20:37:39.000Z","updated_at":"2025-08-14T10:28:21.000Z","dependencies_parsed_at":"2024-02-06T02:25:09.492Z","dependency_job_id":"58c6becd-ceb3-4836-89a2-809ae8373107","html_url":"https://github.com/allenai/dolma","commit_stats":{"total_commits":283,"total_committers":22,"mean_commits":"12.863636363636363","dds":0.6890459363957597,"last_synced_commit":"4cf2d177add315de8e5f90bc6df861ed0c820eb4"},"previous_names":["allenai/dolma"],"tags_count":41,"template":false,"template_full_name":null,"purl":"pkg:github/allenai/dolma","repository_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma","tags_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags","releases_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/releases","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/manifests","owner_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners/allenai","download_url":"https://codeload.github.com/allenai/dolma/tar.gz/refs/heads/main","sbom_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/sbom","scorecard":null,"host":{"name":"GitHub","url":"https://github.com","kind":"github","repositories_count":270519905,"owners_count":24599253,"icon_url":"https://github.com/github.png","version":null,"created_at":"2022-05-30T11:31:42.601Z","updated_at":"2022-07-04T15:15:14.044Z","status":"online","status_checked_at":"2025-08-15T02:00:12.559Z","response_time":110,"last_error":null,"robots_txt_status":"success","robots_txt_updated_at":"2025-07-24T06:49:26.215Z","robots_txt_url":"https://github.com/robots.txt","online":true,"can_crawl_api":true,"host_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub","repositories_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories","repository_names_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repository_names","owners_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners"},"owner_record":{"login":"allenai","name":"AI2","uuid":"5667695","kind":"organization","description":"","email":"ai2-info@allenai.org","website":"http://www.allenai.org","location":"Seattle, WA","twitter":null,"company":null,"icon_url":"https://avatars.githubusercontent.com/u/5667695?v=4","repositories_count":454,"last_synced_at":"2024-04-14T22:06:46.803Z","metadata":{"has_sponsors_listing":false},"html_url":"https://github.com/allenai","funding_links":[],"total_stars":58847,"followers":1621,"following":0,"created_at":"2022-11-06T17:18:34.185Z","updated_at":"2024-04-14T22:08:05.570Z","owner_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners/allenai","repositories_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners/allenai/repositories"},"tags":[{"name":"v1.2.1","sha":"fd22a34972a36bf1a60d2f161533d55b2be4c047","kind":"commit","published_at":"2025-06-25T18:52:53.000Z","download_url":"https://codeload.github.com/allenai/dolma/tar.gz/v1.2.1","html_url":"https://github.com/allenai/dolma/releases/tag/v1.2.1","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/allenai/dolma@v1.2.1","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.2.1","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.2.1/manifests"},{"name":"v1.2.0","sha":"f66cd3ffa397a56c616a63bcfc1ec06a17908d5f","kind":"commit","published_at":"2025-06-03T01:06:25.000Z","download_url":"https://codeload.github.com/allenai/dolma/tar.gz/v1.2.0","html_url":"https://github.com/allenai/dolma/releases/tag/v1.2.0","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/allenai/dolma@v1.2.0","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.2.0","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.2.0/manifests"},{"name":"v1.2.0-dev8","sha":"eb65611fcd35644157c44481f0be2cc15c501be3","kind":"commit","published_at":"2025-04-04T17:00:18.000Z","download_url":"https://codeload.github.com/allenai/dolma/tar.gz/v1.2.0-dev8","html_url":"https://github.com/allenai/dolma/releases/tag/v1.2.0-dev8","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/allenai/dolma@v1.2.0-dev8","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.2.0-dev8","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.2.0-dev8/manifests"},{"name":"1.2.0.dev7","sha":"e9527ebf241b6576e56a4a92826bd898a5f48350","kind":"commit","published_at":"2025-03-05T18:11:21.000Z","download_url":"https://codeload.github.com/allenai/dolma/tar.gz/1.2.0.dev7","html_url":"https://github.com/allenai/dolma/releases/tag/1.2.0.dev7","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/allenai/dolma@1.2.0.dev7","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/1.2.0.dev7","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/1.2.0.dev7/manifests"},{"name":"v1.1.2","sha":"3916871f53bee9244abcc964c717a631846e9174","kind":"commit","published_at":"2025-02-20T00:40:24.000Z","download_url":"https://codeload.github.com/allenai/dolma/tar.gz/v1.1.2","html_url":"https://github.com/allenai/dolma/releases/tag/v1.1.2","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/allenai/dolma@v1.1.2","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.1.2","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.1.2/manifests"},{"name":"v1.1.1.post3","sha":"17242c32b1fb117e430c7325e64ad250115b37ce","kind":"commit","published_at":"2025-02-14T00:57:24.000Z","download_url":"https://codeload.github.com/allenai/dolma/tar.gz/v1.1.1.post3","html_url":"https://github.com/allenai/dolma/releases/tag/v1.1.1.post3","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/allenai/dolma@v1.1.1.post3","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.1.1.post3","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.1.1.post3/manifests"},{"name":"v1.2.0-dev6","sha":"81711b885ae9e26ead2061b8d45770eb36a644b3","kind":"commit","published_at":"2025-02-13T23:15:05.000Z","download_url":"https://codeload.github.com/allenai/dolma/tar.gz/v1.2.0-dev6","html_url":"https://github.com/allenai/dolma/releases/tag/v1.2.0-dev6","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/allenai/dolma@v1.2.0-dev6","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.2.0-dev6","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.2.0-dev6/manifests"},{"name":"v1.2.0-dev5","sha":"8d50f74f8b8168724a4f955aa009e25d655d49c7","kind":"commit","published_at":"2025-02-13T21:45:27.000Z","download_url":"https://codeload.github.com/allenai/dolma/tar.gz/v1.2.0-dev5","html_url":"https://github.com/allenai/dolma/releases/tag/v1.2.0-dev5","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/allenai/dolma@v1.2.0-dev5","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.2.0-dev5","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.2.0-dev5/manifests"},{"name":"v1.2.0-dev4","sha":"6eaf41e4eb4fd7f07395278ddd2ee04523f5756e","kind":"commit","published_at":"2025-02-13T21:20:08.000Z","download_url":"https://codeload.github.com/allenai/dolma/tar.gz/v1.2.0-dev4","html_url":"https://github.com/allenai/dolma/releases/tag/v1.2.0-dev4","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/allenai/dolma@v1.2.0-dev4","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.2.0-dev4","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.2.0-dev4/manifests"},{"name":"v1.2.0-dev3","sha":"eef699858883202d5cf10eb711386c9aa98a8eda","kind":"commit","published_at":"2025-02-13T21:01:05.000Z","download_url":"https://codeload.github.com/allenai/dolma/tar.gz/v1.2.0-dev3","html_url":"https://github.com/allenai/dolma/releases/tag/v1.2.0-dev3","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/allenai/dolma@v1.2.0-dev3","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.2.0-dev3","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.2.0-dev3/manifests"},{"name":"v1.2.0-dev2","sha":"2659e3d71b1561902026e8739bb99407e303492b","kind":"commit","published_at":"2025-02-13T20:27:57.000Z","download_url":"https://codeload.github.com/allenai/dolma/tar.gz/v1.2.0-dev2","html_url":"https://github.com/allenai/dolma/releases/tag/v1.2.0-dev2","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/allenai/dolma@v1.2.0-dev2","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.2.0-dev2","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.2.0-dev2/manifests"},{"name":"v1.1.1","sha":"704e8b0757fa7e08b6cff2dc62dd58c99bc39f67","kind":"commit","published_at":"2025-02-13T20:21:28.000Z","download_url":"https://codeload.github.com/allenai/dolma/tar.gz/v1.1.1","html_url":"https://github.com/allenai/dolma/releases/tag/v1.1.1","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/allenai/dolma@v1.1.1","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.1.1","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.1.1/manifests"},{"name":"v1.2.0-dev1","sha":"a2bd2eea7ff0ce1400f610c68747f0ca5cd81c95","kind":"commit","published_at":"2025-02-13T19:51:51.000Z","download_url":"https://codeload.github.com/allenai/dolma/tar.gz/v1.2.0-dev1","html_url":"https://github.com/allenai/dolma/releases/tag/v1.2.0-dev1","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/allenai/dolma@v1.2.0-dev1","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.2.0-dev1","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.2.0-dev1/manifests"},{"name":"v1.2.0-dev0","sha":"cdaf1a65ffbe3a8b7bb21f45234c1d4c9fa501cf","kind":"commit","published_at":"2025-02-13T19:27:45.000Z","download_url":"https://codeload.github.com/allenai/dolma/tar.gz/v1.2.0-dev0","html_url":"https://github.com/allenai/dolma/releases/tag/v1.2.0-dev0","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/allenai/dolma@v1.2.0-dev0","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.2.0-dev0","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.2.0-dev0/manifests"},{"name":"v1.1.0","sha":"a8242205733d6df988b2fa04a96ac0779f277972","kind":"commit","published_at":"2024-12-02T16:45:49.000Z","download_url":"https://codeload.github.com/allenai/dolma/tar.gz/v1.1.0","html_url":"https://github.com/allenai/dolma/releases/tag/v1.1.0","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/allenai/dolma@v1.1.0","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.1.0","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.1.0/manifests"},{"name":"v1.0.14.post1","sha":"c029e94445290d79ae4ee293e5bf5645b5cacfa9","kind":"commit","published_at":"2024-09-24T23:53:00.000Z","download_url":"https://codeload.github.com/allenai/dolma/tar.gz/v1.0.14.post1","html_url":"https://github.com/allenai/dolma/releases/tag/v1.0.14.post1","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/allenai/dolma@v1.0.14.post1","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.0.14.post1","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.0.14.post1/manifests"},{"name":"v1.0.14","sha":"06d521d11a2a39d49cec467eba4e407f0d21a731","kind":"commit","published_at":"2024-09-24T20:08:31.000Z","download_url":"https://codeload.github.com/allenai/dolma/tar.gz/v1.0.14","html_url":"https://github.com/allenai/dolma/releases/tag/v1.0.14","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/allenai/dolma@v1.0.14","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.0.14","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.0.14/manifests"},{"name":"v1.0.13","sha":"8a3c05818009927c7ed644b60394278e8cb3c02e","kind":"commit","published_at":"2024-09-20T20:53:49.000Z","download_url":"https://codeload.github.com/allenai/dolma/tar.gz/v1.0.13","html_url":"https://github.com/allenai/dolma/releases/tag/v1.0.13","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/allenai/dolma@v1.0.13","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.0.13","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.0.13/manifests"},{"name":"v1.0.12","sha":"2a4ef7053a01ff5f08a170e14f88a9211954b1f1","kind":"commit","published_at":"2024-08-28T22:41:30.000Z","download_url":"https://codeload.github.com/allenai/dolma/tar.gz/v1.0.12","html_url":"https://github.com/allenai/dolma/releases/tag/v1.0.12","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/allenai/dolma@v1.0.12","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.0.12","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.0.12/manifests"},{"name":"v1.0.11","sha":"16452bbb66a33aa9e988eec13b143fd96531251a","kind":"commit","published_at":"2024-08-22T01:05:53.000Z","download_url":"https://codeload.github.com/allenai/dolma/tar.gz/v1.0.11","html_url":"https://github.com/allenai/dolma/releases/tag/v1.0.11","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/allenai/dolma@v1.0.11","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.0.11","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.0.11/manifests"},{"name":"v1.0.10","sha":"f365470031b615097e9c8f9ccb167dc35714f1fa","kind":"commit","published_at":"2024-08-17T21:24:29.000Z","download_url":"https://codeload.github.com/allenai/dolma/tar.gz/v1.0.10","html_url":"https://github.com/allenai/dolma/releases/tag/v1.0.10","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/allenai/dolma@v1.0.10","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.0.10","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.0.10/manifests"},{"name":"v1.0.9","sha":"c4fa395c8fc7782c9d112b66f6e1c46e0b945a5a","kind":"commit","published_at":"2024-08-11T01:17:55.000Z","download_url":"https://codeload.github.com/allenai/dolma/tar.gz/v1.0.9","html_url":"https://github.com/allenai/dolma/releases/tag/v1.0.9","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/allenai/dolma@v1.0.9","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.0.9","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.0.9/manifests"},{"name":"v1.0.8","sha":"4322ad0db0a1938a0f30ea43ac0bebe04289410e","kind":"commit","published_at":"2024-08-06T23:01:38.000Z","download_url":"https://codeload.github.com/allenai/dolma/tar.gz/v1.0.8","html_url":"https://github.com/allenai/dolma/releases/tag/v1.0.8","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/allenai/dolma@v1.0.8","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.0.8","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.0.8/manifests"},{"name":"v1.0.7","sha":"abb67f749d1b83b763d69267d66b590d352a0214","kind":"commit","published_at":"2024-08-06T19:52:35.000Z","download_url":"https://codeload.github.com/allenai/dolma/tar.gz/v1.0.7","html_url":"https://github.com/allenai/dolma/releases/tag/v1.0.7","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/allenai/dolma@v1.0.7","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.0.7","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.0.7/manifests"},{"name":"v1.0.6","sha":"a72c76b26b92e22eeab10905f76c739c73bf4535","kind":"commit","published_at":"2024-08-01T16:47:06.000Z","download_url":"https://codeload.github.com/allenai/dolma/tar.gz/v1.0.6","html_url":"https://github.com/allenai/dolma/releases/tag/v1.0.6","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/allenai/dolma@v1.0.6","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.0.6","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.0.6/manifests"},{"name":"v1.0.5","sha":"a01a2229ea0626dfda243e1cc2e82afe53071a0a","kind":"commit","published_at":"2024-07-26T20:07:12.000Z","download_url":"https://codeload.github.com/allenai/dolma/tar.gz/v1.0.5","html_url":"https://github.com/allenai/dolma/releases/tag/v1.0.5","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/allenai/dolma@v1.0.5","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.0.5","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.0.5/manifests"},{"name":"v1.0.4","sha":"5868453e7cda753af4bf66058c5518c017df8729","kind":"commit","published_at":"2024-07-24T19:01:56.000Z","download_url":"https://codeload.github.com/allenai/dolma/tar.gz/v1.0.4","html_url":"https://github.com/allenai/dolma/releases/tag/v1.0.4","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/allenai/dolma@v1.0.4","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.0.4","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.0.4/manifests"},{"name":"v1.0.3","sha":"6673ad32f561c59a2c412f806385c3d7cc3681f3","kind":"commit","published_at":"2024-04-10T20:41:16.000Z","download_url":"https://codeload.github.com/allenai/dolma/tar.gz/v1.0.3","html_url":"https://github.com/allenai/dolma/releases/tag/v1.0.3","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/allenai/dolma@v1.0.3","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.0.3","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.0.3/manifests"},{"name":"v1.0.2","sha":"4e1d17f091668abbc4748ef2ba2fd721d7e6144d","kind":"commit","published_at":"2024-03-21T16:44:51.000Z","download_url":"https://codeload.github.com/allenai/dolma/tar.gz/v1.0.2","html_url":"https://github.com/allenai/dolma/releases/tag/v1.0.2","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/allenai/dolma@v1.0.2","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.0.2","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.0.2/manifests"},{"name":"v1.0.1","sha":"f6970d51ed14979a70bab7e3f5317d91c71e3eeb","kind":"commit","published_at":"2024-02-07T18:02:48.000Z","download_url":"https://codeload.github.com/allenai/dolma/tar.gz/v1.0.1","html_url":"https://github.com/allenai/dolma/releases/tag/v1.0.1","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/allenai/dolma@v1.0.1","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.0.1","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.0.1/manifests"},{"name":"v1.0.0","sha":"a74b78ac531e06adb61bf70986c8d2a3ef38e9d7","kind":"commit","published_at":"2024-02-01T08:23:18.000Z","download_url":"https://codeload.github.com/allenai/dolma/tar.gz/v1.0.0","html_url":"https://github.com/allenai/dolma/releases/tag/v1.0.0","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/allenai/dolma@v1.0.0","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.0.0","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v1.0.0/manifests"},{"name":"v0.9.4","sha":"a44489f056188e9598f14a78b0e4bb6c85779bec","kind":"commit","published_at":"2024-01-21T02:02:11.000Z","download_url":"https://codeload.github.com/allenai/dolma/tar.gz/v0.9.4","html_url":"https://github.com/allenai/dolma/releases/tag/v0.9.4","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/allenai/dolma@v0.9.4","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v0.9.4","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v0.9.4/manifests"},{"name":"v0.9.2","sha":"ede739f367827101df2d150f68e897987bd3100e","kind":"commit","published_at":"2024-01-15T06:34:15.000Z","download_url":"https://codeload.github.com/allenai/dolma/tar.gz/v0.9.2","html_url":"https://github.com/allenai/dolma/releases/tag/v0.9.2","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/allenai/dolma@v0.9.2","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v0.9.2","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v0.9.2/manifests"},{"name":"v0.9.1","sha":"2ee1ae27f32c09531699301ef8271a6cb45da2da","kind":"commit","published_at":"2023-10-26T04:55:15.000Z","download_url":"https://codeload.github.com/allenai/dolma/tar.gz/v0.9.1","html_url":"https://github.com/allenai/dolma/releases/tag/v0.9.1","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/allenai/dolma@v0.9.1","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v0.9.1","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v0.9.1/manifests"},{"name":"v0.9.0","sha":"1728f4f5267360fa54662b8e01fc0efa6414e498","kind":"commit","published_at":"2023-10-15T19:25:51.000Z","download_url":"https://codeload.github.com/allenai/dolma/tar.gz/v0.9.0","html_url":"https://github.com/allenai/dolma/releases/tag/v0.9.0","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/allenai/dolma@v0.9.0","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v0.9.0","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v0.9.0/manifests"},{"name":"v0.8.0","sha":"705d358cc5d2467c8ae0a703d3d27aded99d9c8f","kind":"commit","published_at":"2023-08-18T13:26:50.000Z","download_url":"https://codeload.github.com/allenai/dolma/tar.gz/v0.8.0","html_url":"https://github.com/allenai/dolma/releases/tag/v0.8.0","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/allenai/dolma@v0.8.0","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v0.8.0","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v0.8.0/manifests"},{"name":"v0.7.0","sha":"a37e7c6b1c883aea84bd30e78dc6589859c881f5","kind":"commit","published_at":"2023-07-21T14:48:24.000Z","download_url":"https://codeload.github.com/allenai/dolma/tar.gz/v0.7.0","html_url":"https://github.com/allenai/dolma/releases/tag/v0.7.0","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/allenai/dolma@v0.7.0","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v0.7.0","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v0.7.0/manifests"},{"name":"v0.6.5","sha":"10c296461306efa23b1ec74a2d75e2908195e185","kind":"commit","published_at":"2023-07-18T03:40:22.000Z","download_url":"https://codeload.github.com/allenai/dolma/tar.gz/v0.6.5","html_url":"https://github.com/allenai/dolma/releases/tag/v0.6.5","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/allenai/dolma@v0.6.5","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v0.6.5","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v0.6.5/manifests"},{"name":"v0.6.4","sha":"9a04d9dbbdbb2066997e8d7394ba33f477917a10","kind":"commit","published_at":"2023-07-16T00:57:51.000Z","download_url":"https://codeload.github.com/allenai/dolma/tar.gz/v0.6.4","html_url":"https://github.com/allenai/dolma/releases/tag/v0.6.4","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/allenai/dolma@v0.6.4","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v0.6.4","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v0.6.4/manifests"},{"name":"v0.6.3","sha":"422800251c7a3ff1ca6201aab77b06ef2a746574","kind":"commit","published_at":"2023-07-11T00:01:11.000Z","download_url":"https://codeload.github.com/allenai/dolma/tar.gz/v0.6.3","html_url":"https://github.com/allenai/dolma/releases/tag/v0.6.3","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/allenai/dolma@v0.6.3","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v0.6.3","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v0.6.3/manifests"},{"name":"v0.6.2","sha":"eb572198865204924bd6c2ae185a3581a03a1474","kind":"commit","published_at":"2023-07-10T01:20:06.000Z","download_url":"https://codeload.github.com/allenai/dolma/tar.gz/v0.6.2","html_url":"https://github.com/allenai/dolma/releases/tag/v0.6.2","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/allenai/dolma@v0.6.2","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v0.6.2","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/tags/v0.6.2/manifests"}]},"repo_metadata_updated_at":"2025-08-15T03:51:11.627Z","dependent_packages_count":0,"downloads":11143,"downloads_period":"last-month","dependent_repos_count":0,"rankings":{"downloads":5.225938320341463,"dependent_repos_count":69.80777363346114,"dependent_packages_count":7.490033931731681,"stargazers_count":4.879495498239574,"forks_count":10.61343680540663,"docker_downloads_count":null,"average":19.603335637836096},"purl":"pkg:pypi/dolma","advisories":[],"docker_usage_url":"https://docker.ecosyste.ms/usage/pypi/dolma","docker_dependents_count":null,"docker_downloads_count":null,"usage_url":"https://repos.ecosyste.ms/usage/pypi/dolma","dependent_repositories_url":"https://repos.ecosyste.ms/api/v1/usage/pypi/dolma/dependencies","status":null,"funding_links":[],"critical":null,"issue_metadata":{"last_synced_at":"2025-08-01T23:19:12.133Z","issues_count":114,"pull_requests_count":189,"avg_time_to_close_issue":9619177.35,"avg_time_to_close_pull_request":822295.1724137932,"issues_closed_count":100,"pull_requests_closed_count":174,"pull_request_authors_count":30,"issue_authors_count":46,"avg_comments_per_issue":1.8245614035087718,"avg_comments_per_pull_request":0.3915343915343915,"merged_pull_requests_count":158,"bot_issues_count":0,"bot_pull_requests_count":12,"past_year_issues_count":20,"past_year_pull_requests_count":49,"past_year_avg_time_to_close_issue":7721022.125,"past_year_avg_time_to_close_pull_request":1067314.6666666667,"past_year_issues_closed_count":16,"past_year_pull_requests_closed_count":39,"past_year_pull_request_authors_count":14,"past_year_issue_authors_count":17,"past_year_avg_comments_per_issue":1.75,"past_year_avg_comments_per_pull_request":0.16326530612244897,"past_year_bot_issues_count":0,"past_year_bot_pull_requests_count":3,"past_year_merged_pull_requests_count":36,"issues_url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/issues","maintainers":[{"login":"soldni","count":90,"url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/authors/soldni"},{"login":"kyleclo","count":6,"url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/authors/kyleclo"},{"login":"rodneykinney","count":3,"url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/authors/rodneykinney"},{"login":"aman-17","count":1,"url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/authors/aman-17"},{"login":"dirkgr","count":1,"url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/authors/dirkgr"},{"login":"epwalsh","count":1,"url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/authors/epwalsh"}],"active_maintainers":[{"login":"soldni","count":17,"url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/authors/soldni"},{"login":"aman-17","count":1,"url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/authors/aman-17"},{"login":"epwalsh","count":1,"url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/authors/epwalsh"},{"login":"kyleclo","count":1,"url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/authors/kyleclo"}]},"versions_url":"https://packages.ecosyste.ms/api/v1/registries/pypi.org/packages/dolma/versions","version_numbers_url":"https://packages.ecosyste.ms/api/v1/registries/pypi.org/packages/dolma/version_numbers","dependent_packages_url":"https://packages.ecosyste.ms/api/v1/registries/pypi.org/packages/dolma/dependent_packages","related_packages_url":"https://packages.ecosyste.ms/api/v1/registries/pypi.org/packages/dolma/related_packages","maintainers":[{"uuid":"soldni","login":"soldni","name":null,"email":null,"url":null,"packages_count":21,"html_url":"https://pypi.org/user/soldni/","role":null,"created_at":"2023-07-09T04:21:21.207Z","updated_at":"2023-07-09T04:21:21.207Z","packages_url":"https://packages.ecosyste.ms/api/v1/registries/pypi.org/maintainers/soldni/packages"},{"uuid":"kyleclo","login":"kyleclo","name":null,"email":null,"url":null,"packages_count":2,"html_url":"https://pypi.org/user/kyleclo/","role":null,"created_at":"2023-08-04T04:57:34.505Z","updated_at":"2023-08-04T04:57:34.505Z","packages_url":"https://packages.ecosyste.ms/api/v1/registries/pypi.org/maintainers/kyleclo/packages"},{"uuid":"undfined","login":"undfined","name":null,"email":null,"url":null,"packages_count":1,"html_url":"https://pypi.org/user/undfined/","role":null,"created_at":"2024-09-25T07:43:46.402Z","updated_at":"2024-09-25T07:43:46.402Z","packages_url":"https://packages.ecosyste.ms/api/v1/registries/pypi.org/maintainers/undfined/packages"}],"registry":{"name":"pypi.org","url":"https://pypi.org","ecosystem":"pypi","default":true,"packages_count":725151,"maintainers_count":308365,"namespaces_count":0,"keywords_count":238006,"github":"pypi","metadata":{"funded_packages_count":50519},"icon_url":"https://github.com/pypi.png","created_at":"2022-04-04T15:19:23.364Z","updated_at":"2025-09-05T05:40:58.860Z","packages_url":"https://packages.ecosyste.ms/api/v1/registries/pypi.org/packages","maintainers_url":"https://packages.ecosyste.ms/api/v1/registries/pypi.org/maintainers","namespaces_url":"https://packages.ecosyste.ms/api/v1/registries/pypi.org/namespaces"}}],"commits":{"id":1462262,"full_name":"allenai/dolma","default_branch":"main","committers":[{"name":"Luca Soldaini","email":"lucas@allenai.org","login":null,"count":88},{"name":"Luca Soldaini","email":"luca@soldaini.net","login":null,"count":78},{"name":"chris-ha458","email":"hac541309@gmail.com","login":null,"count":69},{"name":"kyleclo","email":"kyleclo@uw.edu","login":null,"count":13},{"name":"dependabot[bot]","email":"49699333+dependabot[bot]","login":"dependabot[bot]","count":7},{"name":"Peter Bjørn Jørgensen","email":"peterbjorgensen@gmail.com","login":null,"count":5},{"name":"David Graham","email":"david.l.graham1@gmail.com","login":null,"count":3},{"name":"Niklas Muennighoff","email":"n.muennighoff@gmail.com","login":null,"count":3},{"name":"Tyler Murray","email":"tylerm@allenai.org","login":null,"count":3},{"name":"Rodney Kinney","email":"rodneyk@allenai.org","login":null,"count":2},{"name":"Arnavi Chheda","email":"arnavic@live.com","login":null,"count":1},{"name":"Ben Bogin","email":"benb969@gmail.com","login":null,"count":1},{"name":"Dirk Groeneveld","email":"dirkg@allenai.org","login":null,"count":1},{"name":"Ishan Anand","email":"github@ishan.org","login":null,"count":1},{"name":"Kenneth Enevoldsen","email":"kennethcenevoldsen@gmail.com","login":null,"count":1},{"name":"Rohit Singh Rathaur","email":"rohitrathore.imh55@gmail.com","login":null,"count":1},{"name":"Simon Willison","email":"swillison@gmail.com","login":null,"count":1},{"name":"Tyler Murray","email":"tylercmurray87@gmail.com","login":null,"count":1},{"name":"Ikko Eltociear Ashimine","email":"eltociear@gmail.com","login":"eltociear","count":1},{"name":"Ian Magnusson","email":"40903802+IanMagnusson","login":"IanMagnusson","count":1},{"name":"Dustin Schwenk","email":"drschwenk","login":"drschwenk","count":1},{"name":"epwalsh","email":"petew@allenai.org","login":null,"count":1}],"total_commits":283,"total_committers":22,"total_bot_commits":7,"total_bot_committers":1,"mean_commits":12.863636363636363,"dds":0.6890459363957597,"past_year_committers":[{"name":"chris-ha458","email":"hac541309@gmail.com","login":null,"count":69},{"name":"Luca Soldaini","email":"lucas@allenai.org","login":null,"count":38},{"name":"Luca Soldaini","email":"luca@soldaini.net","login":null,"count":33},{"name":"dependabot[bot]","email":"49699333+dependabot[bot]","login":"dependabot[bot]","count":7},{"name":"Peter Bjørn Jørgensen","email":"peterbjorgensen@gmail.com","login":null,"count":5},{"name":"David Graham","email":"david.l.graham1@gmail.com","login":null,"count":3},{"name":"Niklas Muennighoff","email":"n.muennighoff@gmail.com","login":null,"count":3},{"name":"Tyler Murray","email":"tylerm@allenai.org","login":null,"count":3},{"name":"Kyle Lo","email":"kyleclo@uw.edu","login":null,"count":2},{"name":"Arnavi Chheda","email":"arnavic@live.com","login":null,"count":1},{"name":"Ben Bogin","email":"benb969@gmail.com","login":null,"count":1},{"name":"Kenneth Enevoldsen","email":"kennethcenevoldsen@gmail.com","login":null,"count":1},{"name":"Rodney Kinney","email":"rodneyk@allenai.org","login":null,"count":1},{"name":"Rohit Singh Rathaur","email":"rohitrathore.imh55@gmail.com","login":null,"count":1},{"name":"Simon Willison","email":"swillison@gmail.com","login":null,"count":1},{"name":"Tyler Murray","email":"tylercmurray87@gmail.com","login":null,"count":1},{"name":"Ikko Eltociear Ashimine","email":"eltociear@gmail.com","login":"eltociear","count":1},{"name":"Ian Magnusson","email":"40903802+IanMagnusson","login":"IanMagnusson","count":1},{"name":"Dustin Schwenk","email":"drschwenk","login":"drschwenk","count":1},{"name":"epwalsh","email":"petew@allenai.org","login":null,"count":1}],"past_year_total_commits":174,"past_year_total_committers":20,"past_year_total_bot_commits":7,"past_year_total_bot_committers":1,"past_year_mean_commits":8.7,"past_year_dds":0.603448275862069,"last_synced_at":"2024-08-17T00:46:44.777Z","last_synced_commit":"4cf2d177add315de8e5f90bc6df861ed0c820eb4","created_at":"2024-01-04T00:14:25.538Z","updated_at":"2024-08-17T00:46:44.777Z","commits_url":"https://commits.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/commits","host":{"name":"GitHub","url":"https://github.com","kind":"github","last_synced_at":"2025-09-02T00:00:07.521Z","repositories_count":5480031,"commits_count":853395369,"contributors_count":31098267,"owners_count":906561,"icon_url":"https://github.com/github.png","host_url":"https://commits.ecosyste.ms/api/v1/hosts/GitHub","repositories_url":"https://commits.ecosyste.ms/api/v1/hosts/GitHub/repositories"}},"issues_stats":{"full_name":"allenai/dolma","html_url":"https://github.com/allenai/dolma","last_synced_at":"2025-08-31T13:45:27.111Z","status":null,"issues_count":86,"pull_requests_count":185,"avg_time_to_close_issue":11846078.64,"avg_time_to_close_pull_request":941192.7423312883,"issues_closed_count":75,"pull_requests_closed_count":163,"pull_request_authors_count":33,"issue_authors_count":45,"avg_comments_per_issue":1.6046511627906976,"avg_comments_per_pull_request":0.3783783783783784,"merged_pull_requests_count":144,"bot_issues_count":0,"bot_pull_requests_count":11,"past_year_issues_count":18,"past_year_pull_requests_count":62,"past_year_avg_time_to_close_issue":5152110.8,"past_year_avg_time_to_close_pull_request":1591246.177777778,"past_year_issues_closed_count":10,"past_year_pull_requests_closed_count":45,"past_year_pull_request_authors_count":15,"past_year_issue_authors_count":15,"past_year_avg_comments_per_issue":0.8333333333333334,"past_year_avg_comments_per_pull_request":0.3225806451612903,"past_year_bot_issues_count":0,"past_year_bot_pull_requests_count":2,"past_year_merged_pull_requests_count":38,"created_at":"2024-01-04T00:14:41.355Z","updated_at":"2025-09-03T06:48:24.812Z","repository_url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma","issues_url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/repositories/allenai%2Fdolma/issues","issue_labels_count":{"enhancement":5},"pull_request_labels_count":{"dependencies":17,"python":2,"github_actions":2,"rust":1},"issue_author_associations_count":{"NONE":65,"CONTRIBUTOR":11,"MEMBER":8},"pull_request_author_associations_count":{"MEMBER":131,"CONTRIBUTOR":92,"NONE":23,"COLLABORATOR":8},"issue_authors":{"hannahzacharski55":20,"soldni":8,"peterbjorgensen":7,"mihara-bot":3,"wannaphong":3,"yushengsu-thu":2,"mrqorib":2,"chschroeder":2,"codefly13":2,"zxnie":1,"Jackwaterveg":1,"ehartford":1,"silverriver":1,"joellliu":1,"XevWright":1,"Tendo33":1,"msaebi1993":1,"WenJett":1,"Vedaad-Shakib":1,"aleien95":1,"RohitRathore1":1,"simonw":1,"aetting":1,"Jianxin-MNM":1,"XiaozhuLove":1,"chris-ha458":1,"mathCrazyy":1,"leeparkuky":1,"RobinQrtz":1,"TTTTao725":1,"revbucket":1,"Nevermetyou65":1,"boxabirds":1,"andrewhojel":1,"baberabb":1,"suolyer":1,"hwijeen":1,"tokenizer-decode":1,"davidbrandfonbrener":1,"john-hewitt":1,"jtalmi":1,"DangoWang":1,"ahmeda14960":1,"KennethEnevoldsen":1},"pull_request_authors":{"soldni":123,"undfined":30,"dependabot[bot]":17,"Whattabatt":9,"kyleclo":8,"peterbjorgensen":8,"chris-ha458":5,"cmwilhelm":5,"no0p":4,"revbucket":4,"yushengsu-thu":3,"Muennighoff":3,"rodneykinney":3,"mariia-iureva":2,"power10dan":2,"epwalsh":2,"arnavic":2,"phishing-database-bot":2,"eltociear":2,"RohitRathore1":2,"simonw":2,"guspan-tanadi":2,"KennethEnevoldsen":2,"regan-huff":2,"IanMagnusson":2,"aman-17":2,"segyges":1,"drschwenk":1,"jacob-morrison":1,"dirkgr":1,"ianand":1,"benbogin":1},"host":{"name":"GitHub","url":"https://github.com","kind":"github","last_synced_at":"2025-09-05T00:00:10.444Z","repositories_count":10100117,"issues_count":31473266,"pull_requests_count":97445500,"authors_count":10702683,"icon_url":"https://github.com/github.png","host_url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub","repositories_url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/repositories","owners_url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/owners","authors_url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/authors"},"past_year_issue_labels_count":{},"past_year_pull_request_labels_count":{"dependencies":1,"rust":1},"past_year_issue_author_associations_count":{"NONE":17,"MEMBER":1},"past_year_pull_request_author_associations_count":{"CONTRIBUTOR":38,"MEMBER":21,"NONE":12,"COLLABORATOR":2},"past_year_issue_authors":{"wannaphong":3,"mrqorib":2,"aetting":1,"ahmeda14960":1,"ehartford":1,"joellliu":1,"msaebi1993":1,"Nevermetyou65":1,"revbucket":1,"RobinQrtz":1,"soldni":1,"WenJett":1,"XevWright":1,"XiaozhuLove":1,"zxnie":1},"past_year_pull_request_authors":{"undfined":22,"soldni":19,"Whattabatt":5,"cmwilhelm":5,"revbucket":4,"no0p":4,"regan-huff":2,"phishing-database-bot":2,"mariia-iureva":2,"guspan-tanadi":2,"aman-17":2,"kyleclo":2,"segyges":1,"dependabot[bot]":1},"maintainers":[{"login":"soldni","count":131,"url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/authors/soldni"},{"login":"kyleclo","count":8,"url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/authors/kyleclo"},{"login":"rodneykinney","count":3,"url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/authors/rodneykinney"},{"login":"aman-17","count":2,"url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/authors/aman-17"},{"login":"epwalsh","count":2,"url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/authors/epwalsh"},{"login":"dirkgr","count":1,"url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/authors/dirkgr"}],"active_maintainers":[{"login":"soldni","count":20,"url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/authors/soldni"},{"login":"aman-17","count":2,"url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/authors/aman-17"},{"login":"kyleclo","count":2,"url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/authors/kyleclo"}]},"events":{"total":{"CreateEvent":75,"ReleaseEvent":4,"IssuesEvent":42,"WatchEvent":304,"DeleteEvent":30,"IssueCommentEvent":52,"PushEvent":517,"PullRequestReviewCommentEvent":31,"PullRequestReviewEvent":53,"PullRequestEvent":62,"ForkEvent":43},"last_year":{"CreateEvent":75,"ReleaseEvent":4,"IssuesEvent":42,"WatchEvent":304,"DeleteEvent":30,"IssueCommentEvent":52,"PushEvent":517,"PullRequestReviewCommentEvent":31,"PullRequestReviewEvent":53,"PullRequestEvent":62,"ForkEvent":43}},"keywords":["data-processing","large-language-models","llm","machile-learning","nlp"],"dependencies":[{"ecosystem":"actions","filepath":".github/workflows/CI.yml","sha":null,"kind":"manifest","created_at":"2023-07-17T00:31:31.960Z","updated_at":"2023-07-17T00:31:31.960Z","repository_link":"https://github.com/allenai/dolma/blob/main/.github/workflows/CI.yml","dependencies":[{"id":11586628754,"package_name":"actions/checkout","ecosystem":"actions","requirements":"v1","direct":true,"kind":"composite","optional":false},{"id":11586628757,"package_name":"actions-rs/toolchain","ecosystem":"actions","requirements":"v1","direct":true,"kind":"composite","optional":false},{"id":11586628759,"package_name":"actions/setup-python","ecosystem":"actions","requirements":"v2","direct":true,"kind":"composite","optional":false},{"id":11586628761,"package_name":"actions/checkout","ecosystem":"actions","requirements":"v3","direct":true,"kind":"composite","optional":false},{"id":11586628763,"package_name":"actions/setup-python","ecosystem":"actions","requirements":"v4","direct":true,"kind":"composite","optional":false},{"id":11586628764,"package_name":"PyO3/maturin-action","ecosystem":"actions","requirements":"v1","direct":true,"kind":"composite","optional":false},{"id":11586628766,"package_name":"actions/upload-artifact","ecosystem":"actions","requirements":"v3","direct":true,"kind":"composite","optional":false},{"id":11586628768,"package_name":"actions/download-artifact","ecosystem":"actions","requirements":"v3","direct":true,"kind":"composite","optional":false}]},{"ecosystem":"cargo","filepath":"Cargo.lock","sha":null,"kind":"lockfile","created_at":"2023-07-17T00:31:34.027Z","updated_at":"2023-07-17T00:31:34.027Z","repository_link":"https://github.com/allenai/dolma/blob/main/Cargo.lock","dependencies":[{"id":11586629710,"package_name":"adler","ecosystem":"cargo","requirements":"1.0.2","direct":false,"kind":"runtime","optional":false},{"id":11586629711,"package_name":"ahash","ecosystem":"cargo","requirements":"0.8.3","direct":false,"kind":"runtime","optional":false},{"id":11586629712,"package_name":"aho-corasick","ecosystem":"cargo","requirements":"1.0.2","direct":false,"kind":"runtime","optional":false},{"id":11586629713,"package_name":"anstream","ecosystem":"cargo","requirements":"0.3.2","direct":false,"kind":"runtime","optional":false},{"id":11586629714,"package_name":"anstyle","ecosystem":"cargo","requirements":"1.0.1","direct":false,"kind":"runtime","optional":false},{"id":11586629715,"package_name":"anstyle-parse","ecosystem":"cargo","requirements":"0.2.1","direct":false,"kind":"runtime","optional":false},{"id":11586629716,"package_name":"anstyle-query","ecosystem":"cargo","requirements":"1.0.0","direct":false,"kind":"runtime","optional":false},{"id":11586629717,"package_name":"anstyle-wincon","ecosystem":"cargo","requirements":"1.0.1","direct":false,"kind":"runtime","optional":false},{"id":11586629718,"package_name":"autocfg","ecosystem":"cargo","requirements":"1.1.0","direct":false,"kind":"runtime","optional":false},{"id":11586629719,"package_name":"aws-config","ecosystem":"cargo","requirements":"0.55.3","direct":false,"kind":"runtime","optional":false},{"id":11586629720,"package_name":"aws-credential-types","ecosystem":"cargo","requirements":"0.55.3","direct":false,"kind":"runtime","optional":false},{"id":11586629721,"package_name":"aws-endpoint","ecosystem":"cargo","requirements":"0.55.3","direct":false,"kind":"runtime","optional":false},{"id":11586629722,"package_name":"aws-http","ecosystem":"cargo","requirements":"0.55.3","direct":false,"kind":"runtime","optional":false},{"id":11586629723,"package_name":"aws-sdk-s3","ecosystem":"cargo","requirements":"0.25.1","direct":false,"kind":"runtime","optional":false},{"id":11586629724,"package_name":"aws-sdk-sso","ecosystem":"cargo","requirements":"0.28.0","direct":false,"kind":"runtime","optional":false},{"id":11586629725,"package_name":"aws-sdk-sts","ecosystem":"cargo","requirements":"0.28.0","direct":false,"kind":"runtime","optional":false},{"id":11586629726,"package_name":"aws-sig-auth","ecosystem":"cargo","requirements":"0.55.3","direct":false,"kind":"runtime","optional":false},{"id":11586629727,"package_name":"aws-sigv4","ecosystem":"cargo","requirements":"0.55.3","direct":false,"kind":"runtime","optional":false},{"id":11586629728,"package_name":"aws-smithy-async","ecosystem":"cargo","requirements":"0.55.3","direct":false,"kind":"runtime","optional":false},{"id":11586629729,"package_name":"aws-smithy-checksums","ecosystem":"cargo","requirements":"0.55.3","direct":false,"kind":"runtime","optional":false},{"id":11586629730,"package_name":"aws-smithy-client","ecosystem":"cargo","requirements":"0.55.3","direct":false,"kind":"runtime","optional":false},{"id":11586629731,"package_name":"aws-smithy-eventstream","ecosystem":"cargo","requirements":"0.55.3","direct":false,"kind":"runtime","optional":false},{"id":11586629732,"package_name":"aws-smithy-http","ecosystem":"cargo","requirements":"0.55.3","direct":false,"kind":"runtime","optional":false},{"id":11586629733,"package_name":"aws-smithy-http-tower","ecosystem":"cargo","requirements":"0.55.3","direct":false,"kind":"runtime","optional":false},{"id":11586629734,"package_name":"aws-smithy-json","ecosystem":"cargo","requirements":"0.55.3","direct":false,"kind":"runtime","optional":false},{"id":11586629735,"package_name":"aws-smithy-query","ecosystem":"cargo","requirements":"0.55.3","direct":false,"kind":"runtime","optional":false},{"id":11586629736,"package_name":"aws-smithy-types","ecosystem":"cargo","requirements":"0.55.3","direct":false,"kind":"runtime","optional":false},{"id":11586629737,"package_name":"aws-smithy-xml","ecosystem":"cargo","requirements":"0.55.3","direct":false,"kind":"runtime","optional":false},{"id":11586629738,"package_name":"aws-types","ecosystem":"cargo","requirements":"0.55.3","direct":false,"kind":"runtime","optional":false},{"id":11586629739,"package_name":"base64","ecosystem":"cargo","requirements":"0.21.2","direct":false,"kind":"runtime","optional":false},{"id":11586629740,"package_name":"base64-simd","ecosystem":"cargo","requirements":"0.8.0","direct":false,"kind":"runtime","optional":false},{"id":11586629741,"package_name":"bitflags","ecosystem":"cargo","requirements":"1.3.2","direct":false,"kind":"runtime","optional":false},{"id":11586629742,"package_name":"block-buffer","ecosystem":"cargo","requirements":"0.10.4","direct":false,"kind":"runtime","optional":false},{"id":11586629743,"package_name":"bumpalo","ecosystem":"cargo","requirements":"3.13.0","direct":false,"kind":"runtime","optional":false},{"id":11586629744,"package_name":"byteorder","ecosystem":"cargo","requirements":"1.4.3","direct":false,"kind":"runtime","optional":false},{"id":11586629745,"package_name":"bytes","ecosystem":"cargo","requirements":"1.4.0","direct":false,"kind":"runtime","optional":false},{"id":11586629746,"package_name":"bytes-utils","ecosystem":"cargo","requirements":"0.1.3","direct":false,"kind":"runtime","optional":false},{"id":11586629748,"package_name":"cc","ecosystem":"cargo","requirements":"1.0.79","direct":false,"kind":"runtime","optional":false},{"id":11586629749,"package_name":"cfg-if","ecosystem":"cargo","requirements":"1.0.0","direct":false,"kind":"runtime","optional":false},{"id":11586629750,"package_name":"clap","ecosystem":"cargo","requirements":"4.3.8","direct":false,"kind":"runtime","optional":false},{"id":11586629752,"package_name":"clap_builder","ecosystem":"cargo","requirements":"4.3.8","direct":false,"kind":"runtime","optional":false},{"id":11586629754,"package_name":"clap_derive","ecosystem":"cargo","requirements":"4.3.2","direct":false,"kind":"runtime","optional":false},{"id":11586629756,"package_name":"clap_lex","ecosystem":"cargo","requirements":"0.5.0","direct":false,"kind":"runtime","optional":false},{"id":11586629757,"package_name":"cmake","ecosystem":"cargo","requirements":"0.1.50","direct":false,"kind":"runtime","optional":false},{"id":11586629758,"package_name":"colorchoice","ecosystem":"cargo","requirements":"1.0.0","direct":false,"kind":"runtime","optional":false},{"id":11586629759,"package_name":"core-foundation","ecosystem":"cargo","requirements":"0.9.3","direct":false,"kind":"runtime","optional":false},{"id":11586629760,"package_name":"core-foundation-sys","ecosystem":"cargo","requirements":"0.8.4","direct":false,"kind":"runtime","optional":false},{"id":11586629761,"package_name":"cpufeatures","ecosystem":"cargo","requirements":"0.2.8","direct":false,"kind":"runtime","optional":false},{"id":11586629762,"package_name":"crc32c","ecosystem":"cargo","requirements":"0.6.3","direct":false,"kind":"runtime","optional":false},{"id":11586629763,"package_name":"crc32fast","ecosystem":"cargo","requirements":"1.3.2","direct":false,"kind":"runtime","optional":false},{"id":11586629764,"package_name":"crossbeam-channel","ecosystem":"cargo","requirements":"0.5.8","direct":false,"kind":"runtime","optional":false},{"id":11586629765,"package_name":"crossbeam-deque","ecosystem":"cargo","requirements":"0.8.3","direct":false,"kind":"runtime","optional":false},{"id":11586629766,"package_name":"crossbeam-epoch","ecosystem":"cargo","requirements":"0.9.15","direct":false,"kind":"runtime","optional":false},{"id":11586629767,"package_name":"crossbeam-utils","ecosystem":"cargo","requirements":"0.8.16","direct":false,"kind":"runtime","optional":false},{"id":11586629768,"package_name":"crypto-common","ecosystem":"cargo","requirements":"0.1.6","direct":false,"kind":"runtime","optional":false},{"id":11586629769,"package_name":"digest","ecosystem":"cargo","requirements":"0.10.7","direct":false,"kind":"runtime","optional":false},{"id":11586629770,"package_name":"either","ecosystem":"cargo","requirements":"1.8.1","direct":false,"kind":"runtime","optional":false},{"id":11586629771,"package_name":"env_logger","ecosystem":"cargo","requirements":"0.10.0","direct":false,"kind":"runtime","optional":false},{"id":11586629772,"package_name":"errno","ecosystem":"cargo","requirements":"0.3.1","direct":false,"kind":"runtime","optional":false},{"id":11586629773,"package_name":"errno-dragonfly","ecosystem":"cargo","requirements":"0.1.2","direct":false,"kind":"runtime","optional":false},{"id":11586629774,"package_name":"fastrand","ecosystem":"cargo","requirements":"1.9.0","direct":false,"kind":"runtime","optional":false},{"id":11586629775,"package_name":"flate2","ecosystem":"cargo","requirements":"1.0.26","direct":false,"kind":"runtime","optional":false},{"id":11586629776,"package_name":"fnv","ecosystem":"cargo","requirements":"1.0.7","direct":false,"kind":"runtime","optional":false},{"id":11586629777,"package_name":"form_urlencoded","ecosystem":"cargo","requirements":"1.2.0","direct":false,"kind":"runtime","optional":false},{"id":11586629778,"package_name":"futures-channel","ecosystem":"cargo","requirements":"0.3.28","direct":false,"kind":"runtime","optional":false},{"id":11586629779,"package_name":"futures-core","ecosystem":"cargo","requirements":"0.3.28","direct":false,"kind":"runtime","optional":false},{"id":11586629780,"package_name":"futures-sink","ecosystem":"cargo","requirements":"0.3.28","direct":false,"kind":"runtime","optional":false},{"id":11586629781,"package_name":"futures-task","ecosystem":"cargo","requirements":"0.3.28","direct":false,"kind":"runtime","optional":false},{"id":11586629782,"package_name":"futures-util","ecosystem":"cargo","requirements":"0.3.28","direct":false,"kind":"runtime","optional":false},{"id":11586629783,"package_name":"generic-array","ecosystem":"cargo","requirements":"0.14.7","direct":false,"kind":"runtime","optional":false},{"id":11586629784,"package_name":"getrandom","ecosystem":"cargo","requirements":"0.2.10","direct":false,"kind":"runtime","optional":false},{"id":11586629785,"package_name":"glob","ecosystem":"cargo","requirements":"0.3.1","direct":false,"kind":"runtime","optional":false},{"id":11586629786,"package_name":"h2","ecosystem":"cargo","requirements":"0.3.20","direct":false,"kind":"runtime","optional":false},{"id":11586629787,"package_name":"hashbrown","ecosystem":"cargo","requirements":"0.12.3","direct":false,"kind":"runtime","optional":false},{"id":11586629788,"package_name":"heck","ecosystem":"cargo","requirements":"0.4.1","direct":false,"kind":"runtime","optional":false},{"id":11586629789,"package_name":"hermit-abi","ecosystem":"cargo","requirements":"0.2.6","direct":false,"kind":"runtime","optional":false},{"id":11586629790,"package_name":"hermit-abi","ecosystem":"cargo","requirements":"0.3.1","direct":false,"kind":"runtime","optional":false},{"id":11586629791,"package_name":"hex","ecosystem":"cargo","requirements":"0.4.3","direct":false,"kind":"runtime","optional":false},{"id":11586629792,"package_name":"hmac","ecosystem":"cargo","requirements":"0.12.1","direct":false,"kind":"runtime","optional":false},{"id":11586629793,"package_name":"http","ecosystem":"cargo","requirements":"0.2.9","direct":false,"kind":"runtime","optional":false},{"id":11586629794,"package_name":"http-body","ecosystem":"cargo","requirements":"0.4.5","direct":false,"kind":"runtime","optional":false},{"id":11586629795,"package_name":"httparse","ecosystem":"cargo","requirements":"1.8.0","direct":false,"kind":"runtime","optional":false},{"id":11586629796,"package_name":"httpdate","ecosystem":"cargo","requirements":"1.0.2","direct":false,"kind":"runtime","optional":false},{"id":11586629797,"package_name":"humantime","ecosystem":"cargo","requirements":"2.1.0","direct":false,"kind":"runtime","optional":false},{"id":11586629798,"package_name":"hyper","ecosystem":"cargo","requirements":"0.14.27","direct":false,"kind":"runtime","optional":false},{"id":11586629799,"package_name":"hyper-rustls","ecosystem":"cargo","requirements":"0.23.2","direct":false,"kind":"runtime","optional":false},{"id":11586629800,"package_name":"idna","ecosystem":"cargo","requirements":"0.4.0","direct":false,"kind":"runtime","optional":false},{"id":11586629801,"package_name":"indexmap","ecosystem":"cargo","requirements":"1.9.3","direct":false,"kind":"runtime","optional":false},{"id":11586629802,"package_name":"indoc","ecosystem":"cargo","requirements":"1.0.9","direct":false,"kind":"runtime","optional":false},{"id":11586629803,"package_name":"instant","ecosystem":"cargo","requirements":"0.1.12","direct":false,"kind":"runtime","optional":false},{"id":11586629804,"package_name":"io-lifetimes","ecosystem":"cargo","requirements":"1.0.11","direct":false,"kind":"runtime","optional":false},{"id":11586629805,"package_name":"is-terminal","ecosystem":"cargo","requirements":"0.4.7","direct":false,"kind":"runtime","optional":false},{"id":11586629806,"package_name":"itoa","ecosystem":"cargo","requirements":"1.0.6","direct":false,"kind":"runtime","optional":false},{"id":11586629807,"package_name":"js-sys","ecosystem":"cargo","requirements":"0.3.64","direct":false,"kind":"runtime","optional":false},{"id":11586629808,"package_name":"jsonpath-rust","ecosystem":"cargo","requirements":"0.3.0","direct":false,"kind":"runtime","optional":false},{"id":11586629809,"package_name":"lazy_static","ecosystem":"cargo","requirements":"1.4.0","direct":false,"kind":"runtime","optional":false},{"id":11586629810,"package_name":"libc","ecosystem":"cargo","requirements":"0.2.147","direct":false,"kind":"runtime","optional":false},{"id":11586629811,"package_name":"libz-ng-sys","ecosystem":"cargo","requirements":"1.1.9","direct":false,"kind":"runtime","optional":false},{"id":11586629812,"package_name":"linux-raw-sys","ecosystem":"cargo","requirements":"0.3.8","direct":false,"kind":"runtime","optional":false},{"id":11586629813,"package_name":"lock_api","ecosystem":"cargo","requirements":"0.4.10","direct":false,"kind":"runtime","optional":false},{"id":11586629814,"package_name":"log","ecosystem":"cargo","requirements":"0.4.19","direct":false,"kind":"runtime","optional":false},{"id":11586629815,"package_name":"md-5","ecosystem":"cargo","requirements":"0.10.5","direct":false,"kind":"runtime","optional":false},{"id":11586629816,"package_name":"memchr","ecosystem":"cargo","requirements":"2.5.0","direct":false,"kind":"runtime","optional":false},{"id":11586629817,"package_name":"memoffset","ecosystem":"cargo","requirements":"0.9.0","direct":false,"kind":"runtime","optional":false},{"id":11586629818,"package_name":"miniz_oxide","ecosystem":"cargo","requirements":"0.7.1","direct":false,"kind":"runtime","optional":false},{"id":11586629819,"package_name":"mio","ecosystem":"cargo","requirements":"0.8.8","direct":false,"kind":"runtime","optional":false},{"id":11586629820,"package_name":"num-integer","ecosystem":"cargo","requirements":"0.1.45","direct":false,"kind":"runtime","optional":false},{"id":11586629821,"package_name":"num-traits","ecosystem":"cargo","requirements":"0.2.15","direct":false,"kind":"runtime","optional":false},{"id":11586629822,"package_name":"num_cpus","ecosystem":"cargo","requirements":"1.15.0","direct":false,"kind":"runtime","optional":false},{"id":11586629823,"package_name":"once_cell","ecosystem":"cargo","requirements":"1.18.0","direct":false,"kind":"runtime","optional":false},{"id":11586629824,"package_name":"openssl-probe","ecosystem":"cargo","requirements":"0.1.5","direct":false,"kind":"runtime","optional":false},{"id":11586629825,"package_name":"outref","ecosystem":"cargo","requirements":"0.5.1","direct":false,"kind":"runtime","optional":false},{"id":11586629826,"package_name":"parking_lot","ecosystem":"cargo","requirements":"0.12.1","direct":false,"kind":"runtime","optional":false},{"id":11586629827,"package_name":"parking_lot_core","ecosystem":"cargo","requirements":"0.9.8","direct":false,"kind":"runtime","optional":false},{"id":11586629828,"package_name":"percent-encoding","ecosystem":"cargo","requirements":"2.3.0","direct":false,"kind":"runtime","optional":false},{"id":11586629829,"package_name":"pest","ecosystem":"cargo","requirements":"2.7.0","direct":false,"kind":"runtime","optional":false},{"id":11586629830,"package_name":"pest_derive","ecosystem":"cargo","requirements":"2.7.0","direct":false,"kind":"runtime","optional":false},{"id":11586629831,"package_name":"pest_generator","ecosystem":"cargo","requirements":"2.7.0","direct":false,"kind":"runtime","optional":false},{"id":11586629832,"package_name":"pest_meta","ecosystem":"cargo","requirements":"2.7.0","direct":false,"kind":"runtime","optional":false},{"id":11586629833,"package_name":"pin-project","ecosystem":"cargo","requirements":"1.1.0","direct":false,"kind":"runtime","optional":false},{"id":11586629834,"package_name":"pin-project-internal","ecosystem":"cargo","requirements":"1.1.0","direct":false,"kind":"runtime","optional":false},{"id":11586629835,"package_name":"pin-project-lite","ecosystem":"cargo","requirements":"0.2.9","direct":false,"kind":"runtime","optional":false},{"id":11586629836,"package_name":"pin-utils","ecosystem":"cargo","requirements":"0.1.0","direct":false,"kind":"runtime","optional":false},{"id":11586629837,"package_name":"ppv-lite86","ecosystem":"cargo","requirements":"0.2.17","direct":false,"kind":"runtime","optional":false},{"id":11586629838,"package_name":"proc-macro2","ecosystem":"cargo","requirements":"1.0.63","direct":false,"kind":"runtime","optional":false},{"id":11586629839,"package_name":"pyo3","ecosystem":"cargo","requirements":"0.19.0","direct":false,"kind":"runtime","optional":false},{"id":11586629840,"package_name":"pyo3-build-config","ecosystem":"cargo","requirements":"0.19.0","direct":false,"kind":"runtime","optional":false},{"id":11586629841,"package_name":"pyo3-ffi","ecosystem":"cargo","requirements":"0.19.0","direct":false,"kind":"runtime","optional":false},{"id":11586629842,"package_name":"pyo3-macros","ecosystem":"cargo","requirements":"0.19.0","direct":false,"kind":"runtime","optional":false},{"id":11586629843,"package_name":"pyo3-macros-backend","ecosystem":"cargo","requirements":"0.19.0","direct":false,"kind":"runtime","optional":false},{"id":11586629844,"package_name":"quote","ecosystem":"cargo","requirements":"1.0.28","direct":false,"kind":"runtime","optional":false},{"id":11586629845,"package_name":"rand","ecosystem":"cargo","requirements":"0.8.5","direct":false,"kind":"runtime","optional":false},{"id":11586629846,"package_name":"rand_chacha","ecosystem":"cargo","requirements":"0.3.1","direct":false,"kind":"runtime","optional":false},{"id":11586629847,"package_name":"rand_core","ecosystem":"cargo","requirements":"0.6.4","direct":false,"kind":"runtime","optional":false},{"id":11586629848,"package_name":"rayon","ecosystem":"cargo","requirements":"1.7.0","direct":false,"kind":"runtime","optional":false},{"id":11586629849,"package_name":"rayon-core","ecosystem":"cargo","requirements":"1.11.0","direct":false,"kind":"runtime","optional":false},{"id":11586629850,"package_name":"redox_syscall","ecosystem":"cargo","requirements":"0.3.5","direct":false,"kind":"runtime","optional":false},{"id":11586629851,"package_name":"regex","ecosystem":"cargo","requirements":"1.8.4","direct":false,"kind":"runtime","optional":false},{"id":11586629852,"package_name":"regex-syntax","ecosystem":"cargo","requirements":"0.7.2","direct":false,"kind":"runtime","optional":false},{"id":11586629853,"package_name":"ring","ecosystem":"cargo","requirements":"0.16.20","direct":false,"kind":"runtime","optional":false},{"id":11586629854,"package_name":"rustc_version","ecosystem":"cargo","requirements":"0.4.0","direct":false,"kind":"runtime","optional":false},{"id":11586629855,"package_name":"rustix","ecosystem":"cargo","requirements":"0.37.20","direct":false,"kind":"runtime","optional":false},{"id":11586629856,"package_name":"rustls","ecosystem":"cargo","requirements":"0.20.8","direct":false,"kind":"runtime","optional":false},{"id":11586629857,"package_name":"rustls-native-certs","ecosystem":"cargo","requirements":"0.6.3","direct":false,"kind":"runtime","optional":false},{"id":11586629858,"package_name":"rustls-pemfile","ecosystem":"cargo","requirements":"1.0.2","direct":false,"kind":"runtime","optional":false},{"id":11586629859,"package_name":"ryu","ecosystem":"cargo","requirements":"1.0.13","direct":false,"kind":"runtime","optional":false},{"id":11586629860,"package_name":"schannel","ecosystem":"cargo","requirements":"0.1.21","direct":false,"kind":"runtime","optional":false},{"id":11586629861,"package_name":"scopeguard","ecosystem":"cargo","requirements":"1.1.0","direct":false,"kind":"runtime","optional":false},{"id":11586629862,"package_name":"sct","ecosystem":"cargo","requirements":"0.7.0","direct":false,"kind":"runtime","optional":false},{"id":11586629863,"package_name":"security-framework","ecosystem":"cargo","requirements":"2.9.1","direct":false,"kind":"runtime","optional":false},{"id":11586629864,"package_name":"security-framework-sys","ecosystem":"cargo","requirements":"2.9.0","direct":false,"kind":"runtime","optional":false},{"id":11586629865,"package_name":"semver","ecosystem":"cargo","requirements":"1.0.17","direct":false,"kind":"runtime","optional":false},{"id":11586629866,"package_name":"serde","ecosystem":"cargo","requirements":"1.0.164","direct":false,"kind":"runtime","optional":false},{"id":11586629867,"package_name":"serde_derive","ecosystem":"cargo","requirements":"1.0.164","direct":false,"kind":"runtime","optional":false},{"id":11586629868,"package_name":"serde_json","ecosystem":"cargo","requirements":"1.0.99","direct":false,"kind":"runtime","optional":false},{"id":11586629869,"package_name":"sha1","ecosystem":"cargo","requirements":"0.10.5","direct":false,"kind":"runtime","optional":false},{"id":11586629870,"package_name":"sha2","ecosystem":"cargo","requirements":"0.10.7","direct":false,"kind":"runtime","optional":false},{"id":11586629871,"package_name":"signal-hook-registry","ecosystem":"cargo","requirements":"1.4.1","direct":false,"kind":"runtime","optional":false},{"id":11586629872,"package_name":"slab","ecosystem":"cargo","requirements":"0.4.8","direct":false,"kind":"runtime","optional":false},{"id":11586629873,"package_name":"smallvec","ecosystem":"cargo","requirements":"1.10.0","direct":false,"kind":"runtime","optional":false},{"id":11586629874,"package_name":"socket2","ecosystem":"cargo","requirements":"0.4.9","direct":false,"kind":"runtime","optional":false},{"id":11586629875,"package_name":"spin","ecosystem":"cargo","requirements":"0.5.2","direct":false,"kind":"runtime","optional":false},{"id":11586629876,"package_name":"strsim","ecosystem":"cargo","requirements":"0.10.0","direct":false,"kind":"runtime","optional":false},{"id":11586629877,"package_name":"subtle","ecosystem":"cargo","requirements":"2.5.0","direct":false,"kind":"runtime","optional":false},{"id":11586629878,"package_name":"syn","ecosystem":"cargo","requirements":"1.0.109","direct":false,"kind":"runtime","optional":false},{"id":11586629879,"package_name":"syn","ecosystem":"cargo","requirements":"2.0.22","direct":false,"kind":"runtime","optional":false},{"id":11586629880,"package_name":"target-lexicon","ecosystem":"cargo","requirements":"0.12.8","direct":false,"kind":"runtime","optional":false},{"id":11586629881,"package_name":"termcolor","ecosystem":"cargo","requirements":"1.2.0","direct":false,"kind":"runtime","optional":false},{"id":11586629882,"package_name":"thiserror","ecosystem":"cargo","requirements":"1.0.40","direct":false,"kind":"runtime","optional":false},{"id":11586629883,"package_name":"thiserror-impl","ecosystem":"cargo","requirements":"1.0.40","direct":false,"kind":"runtime","optional":false},{"id":11586629884,"package_name":"threadpool","ecosystem":"cargo","requirements":"1.8.1","direct":false,"kind":"runtime","optional":false},{"id":11586629885,"package_name":"time","ecosystem":"cargo","requirements":"0.3.22","direct":false,"kind":"runtime","optional":false},{"id":11586629886,"package_name":"time-core","ecosystem":"cargo","requirements":"0.1.1","direct":false,"kind":"runtime","optional":false},{"id":11586629887,"package_name":"time-macros","ecosystem":"cargo","requirements":"0.2.9","direct":false,"kind":"runtime","optional":false},{"id":11586629888,"package_name":"tinyvec","ecosystem":"cargo","requirements":"1.6.0","direct":false,"kind":"runtime","optional":false},{"id":11586629889,"package_name":"tinyvec_macros","ecosystem":"cargo","requirements":"0.1.1","direct":false,"kind":"runtime","optional":false},{"id":11586629890,"package_name":"tokio","ecosystem":"cargo","requirements":"1.28.2","direct":false,"kind":"runtime","optional":false},{"id":11586629891,"package_name":"tokio-macros","ecosystem":"cargo","requirements":"2.1.0","direct":false,"kind":"runtime","optional":false},{"id":11586629892,"package_name":"tokio-rustls","ecosystem":"cargo","requirements":"0.23.4","direct":false,"kind":"runtime","optional":false},{"id":11586629893,"package_name":"tokio-stream","ecosystem":"cargo","requirements":"0.1.14","direct":false,"kind":"runtime","optional":false},{"id":11586629894,"package_name":"tokio-util","ecosystem":"cargo","requirements":"0.7.8","direct":false,"kind":"runtime","optional":false},{"id":11586629895,"package_name":"tower","ecosystem":"cargo","requirements":"0.4.13","direct":false,"kind":"runtime","optional":false},{"id":11586629896,"package_name":"tower-layer","ecosystem":"cargo","requirements":"0.3.2","direct":false,"kind":"runtime","optional":false},{"id":11586629897,"package_name":"tower-service","ecosystem":"cargo","requirements":"0.3.2","direct":false,"kind":"runtime","optional":false},{"id":11586629898,"package_name":"tracing","ecosystem":"cargo","requirements":"0.1.37","direct":false,"kind":"runtime","optional":false},{"id":11586629899,"package_name":"tracing-attributes","ecosystem":"cargo","requirements":"0.1.26","direct":false,"kind":"runtime","optional":false},{"id":11586629900,"package_name":"tracing-core","ecosystem":"cargo","requirements":"0.1.31","direct":false,"kind":"runtime","optional":false},{"id":11586629901,"package_name":"try-lock","ecosystem":"cargo","requirements":"0.2.4","direct":false,"kind":"runtime","optional":false},{"id":11586629902,"package_name":"typenum","ecosystem":"cargo","requirements":"1.16.0","direct":false,"kind":"runtime","optional":false},{"id":11586629903,"package_name":"ucd-trie","ecosystem":"cargo","requirements":"0.1.5","direct":false,"kind":"runtime","optional":false},{"id":11586629904,"package_name":"unicode-bidi","ecosystem":"cargo","requirements":"0.3.13","direct":false,"kind":"runtime","optional":false},{"id":11586629905,"package_name":"unicode-ident","ecosystem":"cargo","requirements":"1.0.9","direct":false,"kind":"runtime","optional":false},{"id":11586629906,"package_name":"unicode-normalization","ecosystem":"cargo","requirements":"0.1.22","direct":false,"kind":"runtime","optional":false},{"id":11586629907,"package_name":"unicode-segmentation","ecosystem":"cargo","requirements":"1.10.1","direct":false,"kind":"runtime","optional":false},{"id":11586629908,"package_name":"unindent","ecosystem":"cargo","requirements":"0.1.11","direct":false,"kind":"runtime","optional":false},{"id":11586629909,"package_name":"untrusted","ecosystem":"cargo","requirements":"0.7.1","direct":false,"kind":"runtime","optional":false},{"id":11586629910,"package_name":"url","ecosystem":"cargo","requirements":"2.4.0","direct":false,"kind":"runtime","optional":false},{"id":11586629911,"package_name":"urlencoding","ecosystem":"cargo","requirements":"2.1.2","direct":false,"kind":"runtime","optional":false},{"id":11586629912,"package_name":"utf8parse","ecosystem":"cargo","requirements":"0.2.1","direct":false,"kind":"runtime","optional":false},{"id":11586629913,"package_name":"version_check","ecosystem":"cargo","requirements":"0.9.4","direct":false,"kind":"runtime","optional":false},{"id":11586629914,"package_name":"vsimd","ecosystem":"cargo","requirements":"0.8.0","direct":false,"kind":"runtime","optional":false},{"id":11586629915,"package_name":"want","ecosystem":"cargo","requirements":"0.3.1","direct":false,"kind":"runtime","optional":false},{"id":11586629916,"package_name":"wasi","ecosystem":"cargo","requirements":"0.11.0+wasi-snapshot-preview1","direct":false,"kind":"runtime","optional":false},{"id":11586629917,"package_name":"wasm-bindgen","ecosystem":"cargo","requirements":"0.2.87","direct":false,"kind":"runtime","optional":false},{"id":11586629918,"package_name":"wasm-bindgen-backend","ecosystem":"cargo","requirements":"0.2.87","direct":false,"kind":"runtime","optional":false},{"id":11586629919,"package_name":"wasm-bindgen-macro","ecosystem":"cargo","requirements":"0.2.87","direct":false,"kind":"runtime","optional":false},{"id":11586629920,"package_name":"wasm-bindgen-macro-support","ecosystem":"cargo","requirements":"0.2.87","direct":false,"kind":"runtime","optional":false},{"id":11586629921,"package_name":"wasm-bindgen-shared","ecosystem":"cargo","requirements":"0.2.87","direct":false,"kind":"runtime","optional":false},{"id":11586629922,"package_name":"web-sys","ecosystem":"cargo","requirements":"0.3.64","direct":false,"kind":"runtime","optional":false},{"id":11586629923,"package_name":"webpki","ecosystem":"cargo","requirements":"0.22.0","direct":false,"kind":"runtime","optional":false},{"id":11586629924,"package_name":"winapi","ecosystem":"cargo","requirements":"0.3.9","direct":false,"kind":"runtime","optional":false},{"id":11586629925,"package_name":"winapi-i686-pc-windows-gnu","ecosystem":"cargo","requirements":"0.4.0","direct":false,"kind":"runtime","optional":false},{"id":11586629926,"package_name":"winapi-util","ecosystem":"cargo","requirements":"0.1.5","direct":false,"kind":"runtime","optional":false},{"id":11586629927,"package_name":"winapi-x86_64-pc-windows-gnu","ecosystem":"cargo","requirements":"0.4.0","direct":false,"kind":"runtime","optional":false},{"id":11586629928,"package_name":"windows-sys","ecosystem":"cargo","requirements":"0.42.0","direct":false,"kind":"runtime","optional":false},{"id":11586629929,"package_name":"windows-sys","ecosystem":"cargo","requirements":"0.48.0","direct":false,"kind":"runtime","optional":false},{"id":11586629930,"package_name":"windows-targets","ecosystem":"cargo","requirements":"0.48.0","direct":false,"kind":"runtime","optional":false},{"id":11586629931,"package_name":"windows_aarch64_gnullvm","ecosystem":"cargo","requirements":"0.42.2","direct":false,"kind":"runtime","optional":false},{"id":11586629932,"package_name":"windows_aarch64_gnullvm","ecosystem":"cargo","requirements":"0.48.0","direct":false,"kind":"runtime","optional":false},{"id":11586629933,"package_name":"windows_aarch64_msvc","ecosystem":"cargo","requirements":"0.42.2","direct":false,"kind":"runtime","optional":false},{"id":11586629934,"package_name":"windows_aarch64_msvc","ecosystem":"cargo","requirements":"0.48.0","direct":false,"kind":"runtime","optional":false},{"id":11586629935,"package_name":"windows_i686_gnu","ecosystem":"cargo","requirements":"0.42.2","direct":false,"kind":"runtime","optional":false},{"id":11586629936,"package_name":"windows_i686_gnu","ecosystem":"cargo","requirements":"0.48.0","direct":false,"kind":"runtime","optional":false},{"id":11586629937,"package_name":"windows_i686_msvc","ecosystem":"cargo","requirements":"0.42.2","direct":false,"kind":"runtime","optional":false},{"id":11586629938,"package_name":"windows_i686_msvc","ecosystem":"cargo","requirements":"0.48.0","direct":false,"kind":"runtime","optional":false},{"id":11586629939,"package_name":"windows_x86_64_gnu","ecosystem":"cargo","requirements":"0.42.2","direct":false,"kind":"runtime","optional":false},{"id":11586629940,"package_name":"windows_x86_64_gnu","ecosystem":"cargo","requirements":"0.48.0","direct":false,"kind":"runtime","optional":false},{"id":11586629941,"package_name":"windows_x86_64_gnullvm","ecosystem":"cargo","requirements":"0.42.2","direct":false,"kind":"runtime","optional":false},{"id":11586629942,"package_name":"windows_x86_64_gnullvm","ecosystem":"cargo","requirements":"0.48.0","direct":false,"kind":"runtime","optional":false},{"id":11586629943,"package_name":"windows_x86_64_msvc","ecosystem":"cargo","requirements":"0.42.2","direct":false,"kind":"runtime","optional":false},{"id":11586629944,"package_name":"windows_x86_64_msvc","ecosystem":"cargo","requirements":"0.48.0","direct":false,"kind":"runtime","optional":false},{"id":11586629945,"package_name":"xmlparser","ecosystem":"cargo","requirements":"0.13.5","direct":false,"kind":"runtime","optional":false},{"id":11586629946,"package_name":"zeroize","ecosystem":"cargo","requirements":"1.6.0","direct":false,"kind":"runtime","optional":false}]},{"ecosystem":"pypi","filepath":"pyproject.toml","sha":null,"kind":"manifest","created_at":"2023-07-17T00:31:34.556Z","updated_at":"2023-07-17T00:31:34.556Z","repository_link":"https://github.com/allenai/dolma/blob/main/pyproject.toml","dependencies":[{"id":11586630765,"package_name":"anyascii","ecosystem":"pypi","requirements":"\u003e=0.3.2","direct":true,"kind":"runtime","optional":false},{"id":11586630766,"package_name":"blingfire","ecosystem":"pypi","requirements":"==0.1.8","direct":true,"kind":"runtime","optional":false},{"id":11586630767,"package_name":"boto3","ecosystem":"pypi","requirements":"*","direct":true,"kind":"runtime","optional":false},{"id":11586630768,"package_name":"cached-path","ecosystem":"pypi","requirements":"==1.3.4","direct":true,"kind":"runtime","optional":false},{"id":11586630769,"package_name":"detect-secrets","ecosystem":"pypi","requirements":"==1.4.0","direct":true,"kind":"runtime","optional":false},{"id":11586630774,"package_name":"fasttext-wheel","ecosystem":"pypi","requirements":"==0.9.2","direct":true,"kind":"runtime","optional":false},{"id":11586630775,"package_name":"fsspec","ecosystem":"pypi","requirements":"*","direct":true,"kind":"runtime","optional":false},{"id":11586630776,"package_name":"msgspec","ecosystem":"pypi","requirements":"\u003e=0.14.2","direct":true,"kind":"runtime","optional":false},{"id":11586630777,"package_name":"nltk","ecosystem":"pypi","requirements":"==3.8.1","direct":true,"kind":"runtime","optional":false},{"id":11586630778,"package_name":"omegaconf","ecosystem":"pypi","requirements":"\u003e=2.3.0","direct":true,"kind":"runtime","optional":false},{"id":11586630779,"package_name":"presidio_analyzer","ecosystem":"pypi","requirements":"==2.2.32","direct":true,"kind":"runtime","optional":false},{"id":11586630780,"package_name":"pycld2","ecosystem":"pypi","requirements":"==0.41","direct":true,"kind":"runtime","optional":false},{"id":11586630781,"package_name":"pyyaml","ecosystem":"pypi","requirements":"*","direct":true,"kind":"runtime","optional":false},{"id":11586630782,"package_name":"requests","ecosystem":"pypi","requirements":"*","direct":true,"kind":"runtime","optional":false},{"id":11586630783,"package_name":"rich","ecosystem":"pypi","requirements":"*","direct":true,"kind":"runtime","optional":false},{"id":11586630784,"package_name":"s3fs","ecosystem":"pypi","requirements":"*","direct":true,"kind":"runtime","optional":false},{"id":11586630785,"package_name":"smart-open","ecosystem":"pypi","requirements":"*","direct":true,"kind":"runtime","optional":false},{"id":11586630786,"package_name":"tokenizers","ecosystem":"pypi","requirements":"\u003e=0.13.3,\u003c1.0.0","direct":true,"kind":"runtime","optional":false},{"id":11586630787,"package_name":"tqdm","ecosystem":"pypi","requirements":"*","direct":true,"kind":"runtime","optional":false},{"id":11586630788,"package_name":"uniseg","ecosystem":"pypi","requirements":"*","direct":true,"kind":"runtime","optional":false}]},{"ecosystem":"actions","filepath":".github/workflows/ISSUE_TEMPLATE/bug_report.yml","sha":null,"kind":"manifest","created_at":"2023-09-24T03:46:33.253Z","updated_at":"2023-09-24T03:46:33.253Z","repository_link":"https://github.com/allenai/dolma/blob/main/.github/workflows/ISSUE_TEMPLATE/bug_report.yml","dependencies":[]},{"ecosystem":"actions","filepath":".github/workflows/ISSUE_TEMPLATE/documentation.yml","sha":null,"kind":"manifest","created_at":"2023-09-24T03:46:33.955Z","updated_at":"2023-09-24T03:46:33.955Z","repository_link":"https://github.com/allenai/dolma/blob/main/.github/workflows/ISSUE_TEMPLATE/documentation.yml","dependencies":[]},{"ecosystem":"actions","filepath":".github/workflows/ISSUE_TEMPLATE/feature_request.yml","sha":null,"kind":"manifest","created_at":"2023-09-24T03:46:34.770Z","updated_at":"2023-09-24T03:46:34.770Z","repository_link":"https://github.com/allenai/dolma/blob/main/.github/workflows/ISSUE_TEMPLATE/feature_request.yml","dependencies":[]},{"ecosystem":"actions","filepath":".github/workflows/ISSUE_TEMPLATE/question.yml","sha":null,"kind":"manifest","created_at":"2023-09-24T03:46:35.372Z","updated_at":"2023-09-24T03:46:35.372Z","repository_link":"https://github.com/allenai/dolma/blob/main/.github/workflows/ISSUE_TEMPLATE/question.yml","dependencies":[]},{"ecosystem":"cargo","filepath":"Cargo.toml","sha":null,"kind":"manifest","created_at":"2023-09-24T03:46:35.781Z","updated_at":"2023-09-24T03:46:35.781Z","repository_link":"https://github.com/allenai/dolma/blob/main/Cargo.toml","dependencies":[]},{"ecosystem":"pypi","filepath":"sources/reddit/atomic_content_v3/requirements.txt","sha":null,"kind":"manifest","created_at":"2023-12-15T23:50:59.895Z","updated_at":"2023-12-15T23:50:59.895Z","repository_link":"https://github.com/allenai/dolma/blob/main/sources/reddit/atomic_content_v3/requirements.txt","dependencies":[{"id":15118645486,"package_name":"apache-beam","ecosystem":"pypi","requirements":"*","direct":true,"kind":"runtime","optional":false},{"id":15118645487,"package_name":"jsonlines","ecosystem":"pypi","requirements":"*","direct":true,"kind":"runtime","optional":false}]},{"ecosystem":"pypi","filepath":"sources/reddit/atomic_content_v3/setup.py","sha":null,"kind":"manifest","created_at":"2023-12-15T23:50:59.944Z","updated_at":"2023-12-15T23:50:59.944Z","repository_link":"https://github.com/allenai/dolma/blob/main/sources/reddit/atomic_content_v3/setup.py","dependencies":[{"id":15118645488,"package_name":"jsonlines","ecosystem":"pypi","requirements":"*","direct":true,"kind":"runtime","optional":false}]},{"ecosystem":"pypi","filepath":"sources/reddit/atomic_content_v5/requirements.txt","sha":null,"kind":"manifest","created_at":"2023-12-15T23:51:00.363Z","updated_at":"2023-12-15T23:51:00.363Z","repository_link":"https://github.com/allenai/dolma/blob/main/sources/reddit/atomic_content_v5/requirements.txt","dependencies":[{"id":15118645489,"package_name":"apache-beam","ecosystem":"pypi","requirements":"*","direct":true,"kind":"runtime","optional":false},{"id":15118645490,"package_name":"jsonlines","ecosystem":"pypi","requirements":"*","direct":true,"kind":"runtime","optional":false}]},{"ecosystem":"pypi","filepath":"sources/reddit/atomic_content_v5/setup.py","sha":null,"kind":"manifest","created_at":"2023-12-15T23:51:00.515Z","updated_at":"2023-12-15T23:51:00.515Z","repository_link":"https://github.com/allenai/dolma/blob/main/sources/reddit/atomic_content_v5/setup.py","dependencies":[{"id":15118645491,"package_name":"jsonlines","ecosystem":"pypi","requirements":"*","direct":true,"kind":"runtime","optional":false}]},{"ecosystem":"pypi","filepath":"sources/reddit/comment_threads_v1/requirements.txt","sha":null,"kind":"manifest","created_at":"2023-12-15T23:51:00.569Z","updated_at":"2023-12-15T23:51:00.569Z","repository_link":"https://github.com/allenai/dolma/blob/main/sources/reddit/comment_threads_v1/requirements.txt","dependencies":[{"id":15118645492,"package_name":"apache-beam","ecosystem":"pypi","requirements":"*","direct":true,"kind":"runtime","optional":false},{"id":15118645493,"package_name":"jsonlines","ecosystem":"pypi","requirements":"*","direct":true,"kind":"runtime","optional":false},{"id":15118645494,"package_name":"datasets","ecosystem":"pypi","requirements":"*","direct":true,"kind":"runtime","optional":false}]},{"ecosystem":"pypi","filepath":"sources/reddit/comment_threads_v1/setup.py","sha":null,"kind":"manifest","created_at":"2023-12-15T23:51:00.720Z","updated_at":"2023-12-15T23:51:00.720Z","repository_link":"https://github.com/allenai/dolma/blob/main/sources/reddit/comment_threads_v1/setup.py","dependencies":[{"id":15118645495,"package_name":"jsonlines","ecosystem":"pypi","requirements":"*","direct":true,"kind":"runtime","optional":false}]},{"ecosystem":"pypi","filepath":"sources/reddit/comment_threads_v2/requirements.txt","sha":null,"kind":"manifest","created_at":"2023-12-15T23:51:00.804Z","updated_at":"2023-12-15T23:51:00.804Z","repository_link":"https://github.com/allenai/dolma/blob/main/sources/reddit/comment_threads_v2/requirements.txt","dependencies":[{"id":15118645496,"package_name":"apache-beam","ecosystem":"pypi","requirements":"*","direct":true,"kind":"runtime","optional":false},{"id":15118645497,"package_name":"jsonlines","ecosystem":"pypi","requirements":"*","direct":true,"kind":"runtime","optional":false},{"id":15118645498,"package_name":"datasets","ecosystem":"pypi","requirements":"*","direct":true,"kind":"runtime","optional":false}]},{"ecosystem":"pypi","filepath":"sources/reddit/comment_threads_v2/setup.py","sha":null,"kind":"manifest","created_at":"2023-12-15T23:51:00.904Z","updated_at":"2023-12-15T23:51:00.904Z","repository_link":"https://github.com/allenai/dolma/blob/main/sources/reddit/comment_threads_v2/setup.py","dependencies":[{"id":15118645499,"package_name":"jsonlines","ecosystem":"pypi","requirements":"*","direct":true,"kind":"runtime","optional":false}]},{"ecosystem":"pypi","filepath":"sources/reddit/complete_threads_codelike_v4/requirements.txt","sha":null,"kind":"manifest","created_at":"2023-12-15T23:51:00.971Z","updated_at":"2023-12-15T23:51:00.971Z","repository_link":"https://github.com/allenai/dolma/blob/main/sources/reddit/complete_threads_codelike_v4/requirements.txt","dependencies":[{"id":15118645500,"package_name":"apache-beam","ecosystem":"pypi","requirements":"*","direct":true,"kind":"runtime","optional":false},{"id":15118645501,"package_name":"jsonlines","ecosystem":"pypi","requirements":"*","direct":true,"kind":"runtime","optional":false},{"id":15118645502,"package_name":"datasets","ecosystem":"pypi","requirements":"*","direct":true,"kind":"runtime","optional":false}]},{"ecosystem":"pypi","filepath":"sources/reddit/complete_threads_codelike_v4/setup.py","sha":null,"kind":"manifest","created_at":"2023-12-15T23:51:01.089Z","updated_at":"2023-12-15T23:51:01.089Z","repository_link":"https://github.com/allenai/dolma/blob/main/sources/reddit/complete_threads_codelike_v4/setup.py","dependencies":[{"id":15118645503,"package_name":"jsonlines","ecosystem":"pypi","requirements":"*","direct":true,"kind":"runtime","optional":false}]},{"ecosystem":"pypi","filepath":"sources/starcoder/requirements.txt","sha":null,"kind":"manifest","created_at":"2023-12-15T23:51:01.352Z","updated_at":"2023-12-15T23:51:01.352Z","repository_link":"https://github.com/allenai/dolma/blob/main/sources/starcoder/requirements.txt","dependencies":[{"id":15118645509,"package_name":"pyarrow","ecosystem":"pypi","requirements":"*","direct":true,"kind":"runtime","optional":false}]}],"score":19.59299012323108,"created_at":"2025-09-04T15:51:30.353Z","updated_at":"2025-10-07T08:21:33.873Z","avatar_url":"https://github.com/allenai.png","language":"Python","category":null,"sub_category":null,"monthly_downloads":11143,"funding_links":[],"readme_doi_urls":[],"works":{},"citation_counts":{},"total_citations":0,"keywords_from_contributors":["transformers","cryptocurrencies","language-model","jax","embedded","cryptography","optim","interactive","spacy-extension","tokenizer"],"project_url":"https://science.ecosyste.ms/api/v1/projects/54668","html_url":"https://science.ecosyste.ms/projects/54668","bibtex_url":"https://science.ecosyste.ms/projects/54668/export.bibtex","apalike_url":"https://science.ecosyste.ms/projects/54668/export.apalike"}