{"id":146795,"name":null,"description":"Experiments on including metadata such as URLs, timestamps, website descriptions and HTML tags during pretraining.","url":"https://github.com/bigscience-workshop/metadata","last_synced_at":"2025-09-09T14:40:52.949Z","repository":{"id":37017711,"uuid":"388853237","full_name":"bigscience-workshop/metadata","owner":"bigscience-workshop","description":"Experiments on including metadata such as URLs, timestamps, website descriptions and HTML tags during pretraining.","archived":false,"fork":false,"pushed_at":"2023-06-12T08:48:03.000Z","size":949,"stargazers_count":31,"open_issues_count":38,"forks_count":11,"subscribers_count":18,"default_branch":"master","last_synced_at":"2025-06-13T11:26:18.517Z","etag":null,"topics":[],"latest_commit_sha":null,"homepage":null,"language":"Python","has_issues":true,"has_wiki":null,"has_pages":null,"mirror_url":null,"source_name":null,"license":"apache-2.0","status":null,"scm":"git","pull_requests_enabled":true,"icon_url":"https://github.com/bigscience-workshop.png","metadata":{"files":{"readme":"README.md","changelog":null,"contributing":null,"funding":null,"license":"LICENSE","code_of_conduct":null,"threat_model":null,"audit":null,"citation":null,"codeowners":null,"security":null,"support":null,"governance":null,"roadmap":null,"authors":null,"dei":null,"publiccode":null,"codemeta":null}},"created_at":"2021-07-23T15:55:42.000Z","updated_at":"2025-02-01T18:53:31.000Z","dependencies_parsed_at":"2024-11-11T06:02:17.611Z","dependency_job_id":null,"html_url":"https://github.com/bigscience-workshop/metadata","commit_stats":null,"previous_names":[],"tags_count":0,"template":false,"template_full_name":null,"purl":"pkg:github/bigscience-workshop/metadata","repository_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/bigscience-workshop%2Fmetadata","tags_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/bigscience-workshop%2Fmetadata/tags","releases_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/bigscience-workshop%2Fmetadata/releases","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/bigscience-workshop%2Fmetadata/manifests","owner_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners/bigscience-workshop","download_url":"https://codeload.github.com/bigscience-workshop/metadata/tar.gz/refs/heads/master","sbom_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/bigscience-workshop%2Fmetadata/sbom","scorecard":null,"host":{"name":"GitHub","url":"https://github.com","kind":"github","repositories_count":274314279,"owners_count":25262605,"icon_url":"https://github.com/github.png","version":null,"created_at":"2022-05-30T11:31:42.601Z","updated_at":"2022-07-04T15:15:14.044Z","status":"online","status_checked_at":"2025-09-09T02:00:10.223Z","response_time":80,"last_error":null,"robots_txt_status":"success","robots_txt_updated_at":"2025-07-24T06:49:26.215Z","robots_txt_url":"https://github.com/robots.txt","online":true,"can_crawl_api":true,"host_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub","repositories_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories","repository_names_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repository_names","owners_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners"}},"owner":{"login":"bigscience-workshop","name":"BigScience Workshop","uuid":"82455566","kind":"organization","description":"Research workshop on large language models - The Summer of Language Models 21","email":"bigscience-contact@googlegroups.com","website":"https://bigscience.huggingface.co","location":null,"twitter":"BigScienceW","company":null,"icon_url":"https://avatars.githubusercontent.com/u/82455566?v=4","repositories_count":28,"last_synced_at":"2023-03-03T19:53:10.825Z","metadata":{"has_sponsors_listing":false},"html_url":"https://github.com/bigscience-workshop","funding_links":[],"total_stars":null,"followers":null,"following":null,"created_at":"2022-11-14T05:10:07.455Z","updated_at":"2023-03-03T19:53:10.861Z","owner_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners/bigscience-workshop","repositories_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners/bigscience-workshop/repositories"},"packages":[],"commits":{"id":5057066,"full_name":"bigscience-workshop/metadata","default_branch":"master","committers":null,"total_commits":null,"total_committers":null,"total_bot_commits":null,"total_bot_committers":null,"mean_commits":null,"dds":null,"past_year_committers":null,"past_year_total_commits":null,"past_year_total_committers":null,"past_year_total_bot_commits":null,"past_year_total_bot_committers":null,"past_year_mean_commits":null,"past_year_dds":null,"last_synced_at":null,"last_synced_commit":null,"created_at":"2024-11-11T03:12:45.432Z","updated_at":"2024-11-11T03:12:45.432Z","commits_url":"https://commits.ecosyste.ms/api/v1/hosts/GitHub/repositories/bigscience-workshop%2Fmetadata/commits","host":{"name":"GitHub","url":"https://github.com","kind":"github","last_synced_at":"2025-09-09T00:17:06.873Z","repositories_count":5524511,"commits_count":868166479,"contributors_count":31942272,"owners_count":917070,"icon_url":"https://github.com/github.png","host_url":"https://commits.ecosyste.ms/api/v1/hosts/GitHub","repositories_url":"https://commits.ecosyste.ms/api/v1/hosts/GitHub/repositories"}},"issues_stats":{"full_name":"bigscience-workshop/metadata","html_url":"https://github.com/bigscience-workshop/metadata","last_synced_at":"2024-11-11T03:13:35.402Z","status":null,"issues_count":51,"pull_requests_count":130,"avg_time_to_close_issue":7908443.1034482755,"avg_time_to_close_pull_request":2046837.341880342,"issues_closed_count":29,"pull_requests_closed_count":117,"pull_request_authors_count":11,"issue_authors_count":6,"avg_comments_per_issue":0.8823529411764706,"avg_comments_per_pull_request":0.8076923076923077,"merged_pull_requests_count":104,"bot_issues_count":0,"bot_pull_requests_count":0,"past_year_issues_count":0,"past_year_pull_requests_count":0,"past_year_avg_time_to_close_issue":null,"past_year_avg_time_to_close_pull_request":null,"past_year_issues_closed_count":0,"past_year_pull_requests_closed_count":0,"past_year_pull_request_authors_count":0,"past_year_issue_authors_count":0,"past_year_avg_comments_per_issue":null,"past_year_avg_comments_per_pull_request":null,"past_year_bot_issues_count":0,"past_year_bot_pull_requests_count":0,"past_year_merged_pull_requests_count":0,"created_at":"2024-11-11T03:12:48.518Z","updated_at":"2024-11-11T03:13:35.403Z","repository_url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/repositories/bigscience-workshop%2Fmetadata","issues_url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/repositories/bigscience-workshop%2Fmetadata/issues","issue_labels_count":{"enhancement":8,"wontfix":6,"#dataset":3,"duplicate":3,"question":1,"documentation":1,"bug":1,"Epic":1,"#paragraph_extraction":1},"pull_request_labels_count":{"enhancement":9,"bug":5,"#dataset":3,"#paragraph_extraction":1},"issue_author_associations_count":{"COLLABORATOR":46,"MEMBER":2},"pull_request_author_associations_count":{"COLLABORATOR":89,"MEMBER":20,"CONTRIBUTOR":18,"NONE":1},"issue_authors":{"norakassner":19,"SaulLu":13,"tianjianjiang":12,"manandey":2,"cccntu":1,"shanyas10":1},"pull_request_authors":{"SaulLu":33,"tianjianjiang":24,"cccntu":22,"manandey":20,"shanyas10":8,"jordiclive":7,"timoschick":5,"Muennighoff":3,"ppommer":3,"chkla":2,"masoudjs":1},"host":{"name":"GitHub","url":"https://github.com","kind":"github","last_synced_at":"2025-09-09T00:00:11.778Z","repositories_count":10190614,"issues_count":32231225,"pull_requests_count":101663549,"authors_count":10740619,"icon_url":"https://github.com/github.png","host_url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub","repositories_url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/repositories","owners_url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/owners","authors_url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/authors"},"past_year_issue_labels_count":{},"past_year_pull_request_labels_count":{},"past_year_issue_author_associations_count":{},"past_year_pull_request_author_associations_count":{},"past_year_issue_authors":{},"past_year_pull_request_authors":{},"maintainers":[{"login":"SaulLu","count":46,"url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/authors/SaulLu"},{"login":"tianjianjiang","count":36,"url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/authors/tianjianjiang"},{"login":"cccntu","count":23,"url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/authors/cccntu"},{"login":"manandey","count":22,"url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/authors/manandey"},{"login":"norakassner","count":19,"url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/authors/norakassner"},{"login":"shanyas10","count":9,"url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/authors/shanyas10"},{"login":"chkla","count":2,"url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/authors/chkla"}],"active_maintainers":[]},"events":{"total":{"WatchEvent":1},"last_year":{"WatchEvent":1}},"keywords":[],"dependencies":[{"ecosystem":"actions","filepath":".github/workflows/code_quality.yml","sha":null,"kind":"manifest","created_at":"2023-02-14T14:46:18.682Z","updated_at":"2023-02-14T14:46:18.682Z","repository_link":"https://github.com/bigscience-workshop/metadata/blob/master/.github/workflows/code_quality.yml","dependencies":[{"id":7662290509,"package_name":"actions/checkout","ecosystem":"actions","requirements":"v3","direct":true,"kind":"composite","optional":false},{"id":7662290510,"package_name":"actions/setup-python","ecosystem":"actions","requirements":"v4","direct":true,"kind":"composite","optional":false}]},{"ecosystem":"actions","filepath":".github/workflows/test.yml","sha":null,"kind":"manifest","created_at":"2023-02-14T14:46:18.724Z","updated_at":"2023-02-14T14:46:18.724Z","repository_link":"https://github.com/bigscience-workshop/metadata/blob/master/.github/workflows/test.yml","dependencies":[{"id":7662290515,"package_name":"actions/checkout","ecosystem":"actions","requirements":"v3","direct":true,"kind":"composite","optional":false},{"id":7662290516,"package_name":"actions/setup-python","ecosystem":"actions","requirements":"v4","direct":true,"kind":"composite","optional":false}]},{"ecosystem":"pypi","filepath":"poetry.lock","sha":null,"kind":"lockfile","created_at":"2023-02-14T14:46:18.795Z","updated_at":"2023-02-14T14:46:18.795Z","repository_link":"https://github.com/bigscience-workshop/metadata/blob/master/poetry.lock","dependencies":[{"id":7662290960,"package_name":"accelerate","ecosystem":"pypi","requirements":"0.13.2","direct":false,"kind":"runtime","optional":false},{"id":7662290961,"package_name":"aiohttp","ecosystem":"pypi","requirements":"3.8.3","direct":false,"kind":"runtime","optional":false},{"id":7662290962,"package_name":"aiosignal","ecosystem":"pypi","requirements":"1.2.0","direct":false,"kind":"runtime","optional":false},{"id":7662290963,"package_name":"antlr4-python3-runtime","ecosystem":"pypi","requirements":"4.8","direct":false,"kind":"runtime","optional":false},{"id":7662290964,"package_name":"anyascii","ecosystem":"pypi","requirements":"0.3.1","direct":false,"kind":"runtime","optional":false},{"id":7662290965,"package_name":"async-timeout","ecosystem":"pypi","requirements":"4.0.2","direct":false,"kind":"runtime","optional":false},{"id":7662290966,"package_name":"asynctest","ecosystem":"pypi","requirements":"0.13.0","direct":false,"kind":"runtime","optional":false},{"id":7662290967,"package_name":"atomicwrites","ecosystem":"pypi","requirements":"1.4.1","direct":false,"kind":"runtime","optional":false},{"id":7662290968,"package_name":"attrs","ecosystem":"pypi","requirements":"22.1.0","direct":false,"kind":"runtime","optional":false},{"id":7662290969,"package_name":"black","ecosystem":"pypi","requirements":"22.10.0","direct":false,"kind":"develop","optional":false},{"id":7662290970,"package_name":"bpemb","ecosystem":"pypi","requirements":"0.3.4","direct":false,"kind":"runtime","optional":false},{"id":7662290971,"package_name":"bs-dateutil","ecosystem":"pypi","requirements":"2.8.5","direct":false,"kind":"runtime","optional":false},{"id":7662290972,"package_name":"certifi","ecosystem":"pypi","requirements":"2022.9.24","direct":false,"kind":"runtime","optional":false},{"id":7662290973,"package_name":"charset-normalizer","ecosystem":"pypi","requirements":"2.1.1","direct":false,"kind":"runtime","optional":false},{"id":7662290974,"package_name":"click","ecosystem":"pypi","requirements":"8.1.3","direct":false,"kind":"runtime","optional":false},{"id":7662290975,"package_name":"cloudpickle","ecosystem":"pypi","requirements":"2.2.0","direct":false,"kind":"runtime","optional":false},{"id":7662290976,"package_name":"colorama","ecosystem":"pypi","requirements":"0.4.6","direct":false,"kind":"runtime","optional":false},{"id":7662290977,"package_name":"cycler","ecosystem":"pypi","requirements":"0.11.0","direct":false,"kind":"runtime","optional":false},{"id":7662290978,"package_name":"cython","ecosystem":"pypi","requirements":"0.29.14","direct":false,"kind":"runtime","optional":false},{"id":7662291067,"package_name":"datasets","ecosystem":"pypi","requirements":"2.6.1","direct":false,"kind":"runtime","optional":false},{"id":7662291192,"package_name":"deepspeed","ecosystem":"pypi","requirements":"0.7.4","direct":false,"kind":"runtime","optional":false},{"id":7662291193,"package_name":"deprecated","ecosystem":"pypi","requirements":"1.2.13","direct":false,"kind":"runtime","optional":false},{"id":7662291194,"package_name":"dill","ecosystem":"pypi","requirements":"0.3.5.1","direct":false,"kind":"runtime","optional":false},{"id":7662291195,"package_name":"docker-pycreds","ecosystem":"pypi","requirements":"0.4.0","direct":false,"kind":"runtime","optional":false},{"id":7662291196,"package_name":"filelock","ecosystem":"pypi","requirements":"3.8.0","direct":false,"kind":"runtime","optional":false},{"id":7662291197,"package_name":"flair","ecosystem":"pypi","requirements":"0.5.1","direct":false,"kind":"runtime","optional":false},{"id":7662291209,"package_name":"flake8","ecosystem":"pypi","requirements":"5.0.4","direct":false,"kind":"develop","optional":false},{"id":7662291212,"package_name":"fonttools","ecosystem":"pypi","requirements":"4.38.0","direct":false,"kind":"runtime","optional":false},{"id":7662291213,"package_name":"frozenlist","ecosystem":"pypi","requirements":"1.3.1","direct":false,"kind":"runtime","optional":false},{"id":7662291214,"package_name":"fsspec","ecosystem":"pypi","requirements":"2022.10.0","direct":false,"kind":"runtime","optional":false},{"id":7662291215,"package_name":"future","ecosystem":"pypi","requirements":"0.18.2","direct":false,"kind":"runtime","optional":false},{"id":7662291216,"package_name":"gensim","ecosystem":"pypi","requirements":"3.8.3","direct":false,"kind":"runtime","optional":false},{"id":7662291217,"package_name":"gitdb","ecosystem":"pypi","requirements":"4.0.9","direct":false,"kind":"runtime","optional":false},{"id":7662291218,"package_name":"gitpython","ecosystem":"pypi","requirements":"3.1.29","direct":false,"kind":"runtime","optional":false},{"id":7662291219,"package_name":"hjson","ecosystem":"pypi","requirements":"3.1.0","direct":false,"kind":"runtime","optional":false},{"id":7662291220,"package_name":"htmlmin","ecosystem":"pypi","requirements":"0.1.12","direct":false,"kind":"runtime","optional":false},{"id":7662291221,"package_name":"huggingface-hub","ecosystem":"pypi","requirements":"0.10.1","direct":false,"kind":"runtime","optional":false},{"id":7662291222,"package_name":"hydra-core","ecosystem":"pypi","requirements":"1.1.2","direct":false,"kind":"runtime","optional":false},{"id":7662291223,"package_name":"hyperopt","ecosystem":"pypi","requirements":"0.2.7","direct":false,"kind":"runtime","optional":false},{"id":7662291224,"package_name":"idna","ecosystem":"pypi","requirements":"3.4","direct":false,"kind":"runtime","optional":false},{"id":7662291225,"package_name":"importlib-metadata","ecosystem":"pypi","requirements":"4.2.0","direct":false,"kind":"runtime","optional":false},{"id":7662291226,"package_name":"importlib-resources","ecosystem":"pypi","requirements":"5.2.3","direct":false,"kind":"runtime","optional":false},{"id":7662291227,"package_name":"iniconfig","ecosystem":"pypi","requirements":"1.1.1","direct":false,"kind":"runtime","optional":false},{"id":7662291228,"package_name":"isort","ecosystem":"pypi","requirements":"5.10.1","direct":false,"kind":"develop","optional":false},{"id":7662291229,"package_name":"jieba","ecosystem":"pypi","requirements":"0.42.1","direct":false,"kind":"runtime","optional":false},{"id":7662291230,"package_name":"joblib","ecosystem":"pypi","requirements":"1.2.0","direct":false,"kind":"runtime","optional":false},{"id":7662291231,"package_name":"kiwisolver","ecosystem":"pypi","requirements":"1.4.4","direct":false,"kind":"runtime","optional":false},{"id":7662291232,"package_name":"konoha","ecosystem":"pypi","requirements":"5.3.0","direct":false,"kind":"runtime","optional":false},{"id":7662291233,"package_name":"langdetect","ecosystem":"pypi","requirements":"1.0.9","direct":false,"kind":"runtime","optional":false},{"id":7662291235,"package_name":"lmdb","ecosystem":"pypi","requirements":"1.3.0","direct":false,"kind":"runtime","optional":false},{"id":7662291236,"package_name":"loguru","ecosystem":"pypi","requirements":"0.6.0","direct":false,"kind":"runtime","optional":false},{"id":7662291237,"package_name":"lxml","ecosystem":"pypi","requirements":"4.6.5","direct":false,"kind":"runtime","optional":false},{"id":7662291238,"package_name":"marisa-trie","ecosystem":"pypi","requirements":"0.7.8","direct":false,"kind":"runtime","optional":false},{"id":7662291247,"package_name":"matplotlib","ecosystem":"pypi","requirements":"3.5.3","direct":false,"kind":"runtime","optional":false},{"id":7662291248,"package_name":"mccabe","ecosystem":"pypi","requirements":"0.7.0","direct":false,"kind":"develop","optional":false},{"id":7662291249,"package_name":"mpld3","ecosystem":"pypi","requirements":"0.3","direct":false,"kind":"runtime","optional":false},{"id":7662291250,"package_name":"multidict","ecosystem":"pypi","requirements":"6.0.2","direct":false,"kind":"runtime","optional":false},{"id":7662291251,"package_name":"multiprocess","ecosystem":"pypi","requirements":"0.70.13","direct":false,"kind":"runtime","optional":false},{"id":7662291252,"package_name":"mwparserfromhell","ecosystem":"pypi","requirements":"0.6.4","direct":false,"kind":"runtime","optional":false},{"id":7662291253,"package_name":"mypy-extensions","ecosystem":"pypi","requirements":"0.4.3","direct":false,"kind":"develop","optional":false},{"id":7662291254,"package_name":"networkx","ecosystem":"pypi","requirements":"2.6.3","direct":false,"kind":"runtime","optional":false},{"id":7662291255,"package_name":"ninja","ecosystem":"pypi","requirements":"1.10.2.4","direct":false,"kind":"runtime","optional":false},{"id":7662291256,"package_name":"nltk","ecosystem":"pypi","requirements":"3.6.7","direct":false,"kind":"runtime","optional":false},{"id":7662291257,"package_name":"numpy","ecosystem":"pypi","requirements":"1.21.6","direct":false,"kind":"runtime","optional":false},{"id":7662291258,"package_name":"numpy","ecosystem":"pypi","requirements":"1.22.4","direct":false,"kind":"runtime","optional":false},{"id":7662291259,"package_name":"omegaconf","ecosystem":"pypi","requirements":"2.1.2","direct":false,"kind":"runtime","optional":false},{"id":7662291260,"package_name":"overrides","ecosystem":"pypi","requirements":"3.1.0","direct":false,"kind":"runtime","optional":false},{"id":7662291261,"package_name":"packaging","ecosystem":"pypi","requirements":"21.3","direct":false,"kind":"runtime","optional":false},{"id":7662291262,"package_name":"pandas","ecosystem":"pypi","requirements":"1.3.5","direct":false,"kind":"runtime","optional":false},{"id":7662291263,"package_name":"pandas","ecosystem":"pypi","requirements":"1.5.1","direct":false,"kind":"runtime","optional":false},{"id":7662291264,"package_name":"pathspec","ecosystem":"pypi","requirements":"0.10.1","direct":false,"kind":"develop","optional":false},{"id":7662291265,"package_name":"pathtools","ecosystem":"pypi","requirements":"0.1.2","direct":false,"kind":"runtime","optional":false},{"id":7662291266,"package_name":"pillow","ecosystem":"pypi","requirements":"9.2.0","direct":false,"kind":"runtime","optional":false},{"id":7662291267,"package_name":"platformdirs","ecosystem":"pypi","requirements":"2.5.2","direct":false,"kind":"develop","optional":false},{"id":7662291268,"package_name":"pluggy","ecosystem":"pypi","requirements":"0.13.1","direct":false,"kind":"runtime","optional":false},{"id":7662291269,"package_name":"promise","ecosystem":"pypi","requirements":"2.3","direct":false,"kind":"runtime","optional":false},{"id":7662291270,"package_name":"protobuf","ecosystem":"pypi","requirements":"4.21.9","direct":false,"kind":"runtime","optional":false},{"id":7662291271,"package_name":"psutil","ecosystem":"pypi","requirements":"5.9.3","direct":false,"kind":"runtime","optional":false},{"id":7662291272,"package_name":"py","ecosystem":"pypi","requirements":"1.11.0","direct":false,"kind":"runtime","optional":false},{"id":7662291273,"package_name":"py-cpuinfo","ecosystem":"pypi","requirements":"9.0.0","direct":false,"kind":"runtime","optional":false},{"id":7662291274,"package_name":"py4j","ecosystem":"pypi","requirements":"0.10.9.7","direct":false,"kind":"runtime","optional":false},{"id":7662291275,"package_name":"pyarrow","ecosystem":"pypi","requirements":"7.0.0","direct":false,"kind":"runtime","optional":false},{"id":7662291276,"package_name":"pycodestyle","ecosystem":"pypi","requirements":"2.9.1","direct":false,"kind":"develop","optional":false},{"id":7662291277,"package_name":"pydantic","ecosystem":"pypi","requirements":"1.10.2","direct":false,"kind":"runtime","optional":false},{"id":7662291278,"package_name":"pyflakes","ecosystem":"pypi","requirements":"2.5.0","direct":false,"kind":"develop","optional":false},{"id":7662291279,"package_name":"pyparsing","ecosystem":"pypi","requirements":"3.0.9","direct":false,"kind":"runtime","optional":false},{"id":7662291280,"package_name":"pytest","ecosystem":"pypi","requirements":"6.2.4","direct":false,"kind":"runtime","optional":false},{"id":7662291281,"package_name":"python-dateutil","ecosystem":"pypi","requirements":"2.8.2","direct":false,"kind":"runtime","optional":false},{"id":7662291282,"package_name":"pytz","ecosystem":"pypi","requirements":"2022.5","direct":false,"kind":"runtime","optional":false},{"id":7662291283,"package_name":"pyyaml","ecosystem":"pypi","requirements":"6.0","direct":false,"kind":"runtime","optional":false},{"id":7662291284,"package_name":"regex","ecosystem":"pypi","requirements":"2022.9.13","direct":false,"kind":"runtime","optional":false},{"id":7662291285,"package_name":"REL","ecosystem":"pypi","requirements":"0.0.1","direct":false,"kind":"runtime","optional":false},{"id":7662291286,"package_name":"requests","ecosystem":"pypi","requirements":"2.28.1","direct":false,"kind":"runtime","optional":false},{"id":7662291287,"package_name":"responses","ecosystem":"pypi","requirements":"0.18.0","direct":false,"kind":"runtime","optional":false},{"id":7662291288,"package_name":"scikit-learn","ecosystem":"pypi","requirements":"1.0.2","direct":false,"kind":"runtime","optional":false},{"id":7662291289,"package_name":"scipy","ecosystem":"pypi","requirements":"1.7.3","direct":false,"kind":"runtime","optional":false},{"id":7662291290,"package_name":"segtok","ecosystem":"pypi","requirements":"1.5.11","direct":false,"kind":"runtime","optional":false},{"id":7662291291,"package_name":"sentencepiece","ecosystem":"pypi","requirements":"0.1.97","direct":false,"kind":"runtime","optional":false},{"id":7662291292,"package_name":"sentry-sdk","ecosystem":"pypi","requirements":"1.10.1","direct":false,"kind":"runtime","optional":false},{"id":7662291293,"package_name":"setproctitle","ecosystem":"pypi","requirements":"1.3.2","direct":false,"kind":"runtime","optional":false},{"id":7662291294,"package_name":"setuptools","ecosystem":"pypi","requirements":"62.6.0","direct":false,"kind":"runtime","optional":false},{"id":7662291295,"package_name":"setuptools-scm","ecosystem":"pypi","requirements":"6.4.2","direct":false,"kind":"runtime","optional":false},{"id":7662291296,"package_name":"shortuuid","ecosystem":"pypi","requirements":"1.0.9","direct":false,"kind":"runtime","optional":false},{"id":7662291297,"package_name":"six","ecosystem":"pypi","requirements":"1.16.0","direct":false,"kind":"runtime","optional":false},{"id":7662291298,"package_name":"smart-open","ecosystem":"pypi","requirements":"6.2.0","direct":false,"kind":"runtime","optional":false},{"id":7662291299,"package_name":"smmap","ecosystem":"pypi","requirements":"5.0.0","direct":false,"kind":"runtime","optional":false},{"id":7662291300,"package_name":"sqlitedict","ecosystem":"pypi","requirements":"2.0.0","direct":false,"kind":"runtime","optional":false},{"id":7662291301,"package_name":"tabulate","ecosystem":"pypi","requirements":"0.9.0","direct":false,"kind":"runtime","optional":false},{"id":7662291302,"package_name":"threadpoolctl","ecosystem":"pypi","requirements":"3.1.0","direct":false,"kind":"runtime","optional":false},{"id":7662291303,"package_name":"tokenizers","ecosystem":"pypi","requirements":"0.13.1","direct":false,"kind":"runtime","optional":false},{"id":7662291304,"package_name":"toml","ecosystem":"pypi","requirements":"0.10.2","direct":false,"kind":"runtime","optional":false},{"id":7662291305,"package_name":"tomli","ecosystem":"pypi","requirements":"2.0.1","direct":false,"kind":"runtime","optional":false},{"id":7662291306,"package_name":"torch","ecosystem":"pypi","requirements":"1.9.0","direct":false,"kind":"runtime","optional":false},{"id":7662291307,"package_name":"tqdm","ecosystem":"pypi","requirements":"4.64.1","direct":false,"kind":"runtime","optional":false},{"id":7662291308,"package_name":"transformers","ecosystem":"pypi","requirements":"4.23.1","direct":false,"kind":"runtime","optional":false},{"id":7662291309,"package_name":"typed-ast","ecosystem":"pypi","requirements":"1.5.4","direct":false,"kind":"develop","optional":false},{"id":7662291310,"package_name":"typing-extensions","ecosystem":"pypi","requirements":"4.4.0","direct":false,"kind":"runtime","optional":false},{"id":7662291311,"package_name":"urllib3","ecosystem":"pypi","requirements":"1.26.12","direct":false,"kind":"runtime","optional":false},{"id":7662291312,"package_name":"wandb","ecosystem":"pypi","requirements":"0.13.4","direct":false,"kind":"runtime","optional":false},{"id":7662291313,"package_name":"wheel","ecosystem":"pypi","requirements":"0.37.1","direct":false,"kind":"runtime","optional":false},{"id":7662291314,"package_name":"wikipedia2vec","ecosystem":"pypi","requirements":"1.0.5","direct":false,"kind":"runtime","optional":false},{"id":7662291315,"package_name":"win32-setctime","ecosystem":"pypi","requirements":"1.1.0","direct":false,"kind":"runtime","optional":false},{"id":7662291316,"package_name":"wrapt","ecosystem":"pypi","requirements":"1.14.1","direct":false,"kind":"runtime","optional":false},{"id":7662291317,"package_name":"xxhash","ecosystem":"pypi","requirements":"3.1.0","direct":false,"kind":"runtime","optional":false},{"id":7662291318,"package_name":"yarl","ecosystem":"pypi","requirements":"1.8.1","direct":false,"kind":"runtime","optional":false},{"id":7662291319,"package_name":"zipp","ecosystem":"pypi","requirements":"3.10.0","direct":false,"kind":"runtime","optional":false}]},{"ecosystem":"pypi","filepath":"requirements-dev.txt","sha":null,"kind":"manifest","created_at":"2023-02-14T14:46:19.027Z","updated_at":"2023-02-14T14:46:19.027Z","repository_link":"https://github.com/bigscience-workshop/metadata/blob/master/requirements-dev.txt","dependencies":[{"id":7662291680,"package_name":"isort","ecosystem":"pypi","requirements":"\u003e=5.5.4","direct":true,"kind":"development","optional":false},{"id":7662291681,"package_name":"black","ecosystem":"pypi","requirements":"\u003e=22.3.0","direct":true,"kind":"development","optional":false},{"id":7662291682,"package_name":"flake8","ecosystem":"pypi","requirements":"\u003e=3.8.3","direct":true,"kind":"development","optional":false},{"id":7662291683,"package_name":"pytest","ecosystem":"pypi","requirements":"==6.2.4","direct":true,"kind":"development","optional":false}]},{"ecosystem":"pypi","filepath":"requirements.txt","sha":null,"kind":"manifest","created_at":"2023-02-14T14:46:19.133Z","updated_at":"2023-02-14T14:46:19.133Z","repository_link":"https://github.com/bigscience-workshop/metadata/blob/master/requirements.txt","dependencies":[{"id":7662291710,"package_name":"pyarrow","ecosystem":"pypi","requirements":"\u003e=7.0.0,\u003c8","direct":true,"kind":"runtime","optional":false},{"id":7662291711,"package_name":"numpy","ecosystem":"pypi","requirements":"\u003c1.22","direct":true,"kind":"runtime","optional":false},{"id":7662291712,"package_name":"numpy","ecosystem":"pypi","requirements":"\u003e=1.22","direct":true,"kind":"runtime","optional":false},{"id":7662291713,"package_name":"pandas","ecosystem":"pypi","requirements":"\u003c1.4","direct":true,"kind":"runtime","optional":false},{"id":7662291714,"package_name":"pandas","ecosystem":"pypi","requirements":"\u003e=1.4","direct":true,"kind":"runtime","optional":false},{"id":7662291715,"package_name":"datasets","ecosystem":"pypi","requirements":"\u003e=1.18.4","direct":true,"kind":"runtime","optional":false},{"id":7662291716,"package_name":"tokenizers","ecosystem":"pypi","requirements":"*","direct":true,"kind":"runtime","optional":false},{"id":7662291717,"package_name":"transformers","ecosystem":"pypi","requirements":"\u003e=4.22,\u003c5","direct":true,"kind":"runtime","optional":false},{"id":7662291718,"package_name":"accelerate","ecosystem":"pypi","requirements":"\u003e=0.4.0,\u003c1","direct":true,"kind":"runtime","optional":false},{"id":7662291719,"package_name":"hydra_core","ecosystem":"pypi","requirements":"\u003e=1.1,\u003c1.2","direct":true,"kind":"runtime","optional":false},{"id":7662291720,"package_name":"wandb","ecosystem":"pypi","requirements":"\u003e=0.10.32,\u003c1","direct":true,"kind":"runtime","optional":false},{"id":7662291721,"package_name":"gensim","ecosystem":"pypi","requirements":"\u003e=3.8.3,\u003c4","direct":true,"kind":"runtime","optional":false},{"id":7662291722,"package_name":"nltk","ecosystem":"pypi","requirements":"==3.6.7","direct":true,"kind":"runtime","optional":false},{"id":7662291723,"package_name":"lxml","ecosystem":"pypi","requirements":"==4.6.5","direct":true,"kind":"runtime","optional":false},{"id":7662291724,"package_name":"htmlmin","ecosystem":"pypi","requirements":"==0.1.12","direct":true,"kind":"runtime","optional":false},{"id":7662291725,"package_name":"loguru","ecosystem":"pypi","requirements":"\u003e=0.6.0","direct":true,"kind":"runtime","optional":false},{"id":7662291726,"package_name":"deepspeed","ecosystem":"pypi","requirements":"\u003e=0.6.1","direct":true,"kind":"runtime","optional":false}]},{"ecosystem":"pypi","filepath":"requirements_resolved_with_extras_and_dev.txt","sha":null,"kind":"manifest","created_at":"2023-02-14T14:46:19.182Z","updated_at":"2023-02-14T14:46:19.182Z","repository_link":"https://github.com/bigscience-workshop/metadata/blob/master/requirements_resolved_with_extras_and_dev.txt","dependencies":[{"id":7662291779,"package_name":"accelerate","ecosystem":"pypi","requirements":"==0.13.2","direct":true,"kind":"development","optional":false},{"id":7662291780,"package_name":"aiohttp","ecosystem":"pypi","requirements":"==3.8.3","direct":true,"kind":"development","optional":false},{"id":7662291781,"package_name":"aiosignal","ecosystem":"pypi","requirements":"==1.2.0","direct":true,"kind":"development","optional":false},{"id":7662291782,"package_name":"antlr4-python3-runtime","ecosystem":"pypi","requirements":"==4.8","direct":true,"kind":"development","optional":false},{"id":7662291783,"package_name":"anyascii","ecosystem":"pypi","requirements":"==0.3.1","direct":true,"kind":"development","optional":false},{"id":7662291784,"package_name":"async-timeout","ecosystem":"pypi","requirements":"==4.0.2","direct":true,"kind":"development","optional":false},{"id":7662291785,"package_name":"asynctest","ecosystem":"pypi","requirements":"==0.13.0","direct":true,"kind":"development","optional":false},{"id":7662291786,"package_name":"atomicwrites","ecosystem":"pypi","requirements":"==1.4.1","direct":true,"kind":"development","optional":false},{"id":7662291787,"package_name":"attrs","ecosystem":"pypi","requirements":"==22.1.0","direct":true,"kind":"development","optional":false},{"id":7662291788,"package_name":"black","ecosystem":"pypi","requirements":"==22.10.0","direct":true,"kind":"development","optional":false},{"id":7662291789,"package_name":"bpemb","ecosystem":"pypi","requirements":"==0.3.4","direct":true,"kind":"development","optional":false},{"id":7662291790,"package_name":"certifi","ecosystem":"pypi","requirements":"==2022.9.24","direct":true,"kind":"development","optional":false},{"id":7662291791,"package_name":"charset-normalizer","ecosystem":"pypi","requirements":"==2.1.1","direct":true,"kind":"development","optional":false},{"id":7662291792,"package_name":"click","ecosystem":"pypi","requirements":"==8.1.3","direct":true,"kind":"development","optional":false},{"id":7662291793,"package_name":"cloudpickle","ecosystem":"pypi","requirements":"==2.2.0","direct":true,"kind":"development","optional":false},{"id":7662291794,"package_name":"colorama","ecosystem":"pypi","requirements":"==0.4.6","direct":true,"kind":"development","optional":false},{"id":7662291795,"package_name":"cycler","ecosystem":"pypi","requirements":"==0.11.0","direct":true,"kind":"development","optional":false},{"id":7662291796,"package_name":"cython","ecosystem":"pypi","requirements":"==0.29.14","direct":true,"kind":"development","optional":false},{"id":7662291797,"package_name":"datasets","ecosystem":"pypi","requirements":"==2.6.1","direct":true,"kind":"development","optional":false},{"id":7662291798,"package_name":"deepspeed","ecosystem":"pypi","requirements":"==0.7.4","direct":true,"kind":"development","optional":false},{"id":7662291799,"package_name":"deprecated","ecosystem":"pypi","requirements":"==1.2.13","direct":true,"kind":"development","optional":false},{"id":7662291800,"package_name":"dill","ecosystem":"pypi","requirements":"==0.3.5.1","direct":true,"kind":"development","optional":false},{"id":7662291801,"package_name":"docker-pycreds","ecosystem":"pypi","requirements":"==0.4.0","direct":true,"kind":"development","optional":false},{"id":7662291802,"package_name":"filelock","ecosystem":"pypi","requirements":"==3.8.0","direct":true,"kind":"development","optional":false},{"id":7662291803,"package_name":"flair","ecosystem":"pypi","requirements":"==0.5.1","direct":true,"kind":"development","optional":false},{"id":7662291804,"package_name":"flake8","ecosystem":"pypi","requirements":"==5.0.4","direct":true,"kind":"development","optional":false},{"id":7662291805,"package_name":"fonttools","ecosystem":"pypi","requirements":"==4.38.0","direct":true,"kind":"development","optional":false},{"id":7662291806,"package_name":"frozenlist","ecosystem":"pypi","requirements":"==1.3.1","direct":true,"kind":"development","optional":false},{"id":7662291807,"package_name":"fsspec","ecosystem":"pypi","requirements":"==2022.10.0","direct":true,"kind":"development","optional":false},{"id":7662291808,"package_name":"future","ecosystem":"pypi","requirements":"==0.18.2","direct":true,"kind":"development","optional":false},{"id":7662291809,"package_name":"gensim","ecosystem":"pypi","requirements":"==3.8.3","direct":true,"kind":"development","optional":false},{"id":7662291810,"package_name":"gitdb","ecosystem":"pypi","requirements":"==4.0.9","direct":true,"kind":"development","optional":false},{"id":7662291811,"package_name":"gitpython","ecosystem":"pypi","requirements":"==3.1.29","direct":true,"kind":"development","optional":false},{"id":7662291812,"package_name":"hjson","ecosystem":"pypi","requirements":"==3.1.0","direct":true,"kind":"development","optional":false},{"id":7662291813,"package_name":"htmlmin","ecosystem":"pypi","requirements":"==0.1.12","direct":true,"kind":"development","optional":false},{"id":7662291814,"package_name":"huggingface-hub","ecosystem":"pypi","requirements":"==0.10.1","direct":true,"kind":"development","optional":false},{"id":7662291815,"package_name":"hydra-core","ecosystem":"pypi","requirements":"==1.1.2","direct":true,"kind":"development","optional":false},{"id":7662291816,"package_name":"hyperopt","ecosystem":"pypi","requirements":"==0.2.7","direct":true,"kind":"development","optional":false},{"id":7662291817,"package_name":"idna","ecosystem":"pypi","requirements":"==3.4","direct":true,"kind":"development","optional":false},{"id":7662291818,"package_name":"importlib-metadata","ecosystem":"pypi","requirements":"==4.2.0","direct":true,"kind":"development","optional":false},{"id":7662291819,"package_name":"importlib-resources","ecosystem":"pypi","requirements":"==5.2.3","direct":true,"kind":"development","optional":false},{"id":7662291820,"package_name":"iniconfig","ecosystem":"pypi","requirements":"==1.1.1","direct":true,"kind":"development","optional":false},{"id":7662291821,"package_name":"isort","ecosystem":"pypi","requirements":"==5.10.1","direct":true,"kind":"development","optional":false},{"id":7662291822,"package_name":"jieba","ecosystem":"pypi","requirements":"==0.42.1","direct":true,"kind":"development","optional":false},{"id":7662291823,"package_name":"joblib","ecosystem":"pypi","requirements":"==1.2.0","direct":true,"kind":"development","optional":false},{"id":7662291824,"package_name":"kiwisolver","ecosystem":"pypi","requirements":"==1.4.4","direct":true,"kind":"development","optional":false},{"id":7662291825,"package_name":"konoha","ecosystem":"pypi","requirements":"==5.3.0","direct":true,"kind":"development","optional":false},{"id":7662291826,"package_name":"langdetect","ecosystem":"pypi","requirements":"==1.0.9","direct":true,"kind":"development","optional":false},{"id":7662291827,"package_name":"lmdb","ecosystem":"pypi","requirements":"==1.3.0","direct":true,"kind":"development","optional":false},{"id":7662291828,"package_name":"loguru","ecosystem":"pypi","requirements":"==0.6.0","direct":true,"kind":"development","optional":false},{"id":7662291829,"package_name":"lxml","ecosystem":"pypi","requirements":"==4.6.5","direct":true,"kind":"development","optional":false},{"id":7662291830,"package_name":"marisa-trie","ecosystem":"pypi","requirements":"==0.7.8","direct":true,"kind":"development","optional":false},{"id":7662291831,"package_name":"matplotlib","ecosystem":"pypi","requirements":"==3.5.3","direct":true,"kind":"development","optional":false},{"id":7662291832,"package_name":"mccabe","ecosystem":"pypi","requirements":"==0.7.0","direct":true,"kind":"development","optional":false},{"id":7662291833,"package_name":"mpld3","ecosystem":"pypi","requirements":"==0.3","direct":true,"kind":"development","optional":false},{"id":7662291834,"package_name":"multidict","ecosystem":"pypi","requirements":"==6.0.2","direct":true,"kind":"development","optional":false},{"id":7662291835,"package_name":"multiprocess","ecosystem":"pypi","requirements":"==0.70.13","direct":true,"kind":"development","optional":false},{"id":7662291836,"package_name":"mwparserfromhell","ecosystem":"pypi","requirements":"==0.6.4","direct":true,"kind":"development","optional":false},{"id":7662291837,"package_name":"mypy-extensions","ecosystem":"pypi","requirements":"==0.4.3","direct":true,"kind":"development","optional":false},{"id":7662291838,"package_name":"networkx","ecosystem":"pypi","requirements":"==2.6.3","direct":true,"kind":"development","optional":false},{"id":7662291839,"package_name":"ninja","ecosystem":"pypi","requirements":"==1.10.2.4","direct":true,"kind":"development","optional":false},{"id":7662291840,"package_name":"nltk","ecosystem":"pypi","requirements":"==3.6.7","direct":true,"kind":"development","optional":false},{"id":7662291841,"package_name":"numpy","ecosystem":"pypi","requirements":"==1.21.6","direct":true,"kind":"development","optional":false},{"id":7662291842,"package_name":"numpy","ecosystem":"pypi","requirements":"==1.22.4","direct":true,"kind":"development","optional":false},{"id":7662291843,"package_name":"omegaconf","ecosystem":"pypi","requirements":"==2.1.2","direct":true,"kind":"development","optional":false},{"id":7662291844,"package_name":"overrides","ecosystem":"pypi","requirements":"==3.1.0","direct":true,"kind":"development","optional":false},{"id":7662291845,"package_name":"packaging","ecosystem":"pypi","requirements":"==21.3","direct":true,"kind":"development","optional":false},{"id":7662291846,"package_name":"pandas","ecosystem":"pypi","requirements":"==1.3.5","direct":true,"kind":"development","optional":false},{"id":7662291847,"package_name":"pandas","ecosystem":"pypi","requirements":"==1.5.1","direct":true,"kind":"development","optional":false},{"id":7662291848,"package_name":"pathspec","ecosystem":"pypi","requirements":"==0.10.1","direct":true,"kind":"development","optional":false},{"id":7662291849,"package_name":"pathtools","ecosystem":"pypi","requirements":"==0.1.2","direct":true,"kind":"development","optional":false},{"id":7662291850,"package_name":"pillow","ecosystem":"pypi","requirements":"==9.2.0","direct":true,"kind":"development","optional":false},{"id":7662291851,"package_name":"platformdirs","ecosystem":"pypi","requirements":"==2.5.2","direct":true,"kind":"development","optional":false},{"id":7662291852,"package_name":"pluggy","ecosystem":"pypi","requirements":"==0.13.1","direct":true,"kind":"development","optional":false},{"id":7662291853,"package_name":"promise","ecosystem":"pypi","requirements":"==2.3","direct":true,"kind":"development","optional":false},{"id":7662291854,"package_name":"protobuf","ecosystem":"pypi","requirements":"==4.21.9","direct":true,"kind":"development","optional":false},{"id":7662291855,"package_name":"psutil","ecosystem":"pypi","requirements":"==5.9.3","direct":true,"kind":"development","optional":false},{"id":7662291856,"package_name":"py-cpuinfo","ecosystem":"pypi","requirements":"==9.0.0","direct":true,"kind":"development","optional":false},{"id":7662291857,"package_name":"py4j","ecosystem":"pypi","requirements":"==0.10.9.7","direct":true,"kind":"development","optional":false},{"id":7662291858,"package_name":"py","ecosystem":"pypi","requirements":"==1.11.0","direct":true,"kind":"development","optional":false},{"id":7662291859,"package_name":"pyarrow","ecosystem":"pypi","requirements":"==7.0.0","direct":true,"kind":"development","optional":false},{"id":7662291860,"package_name":"pycodestyle","ecosystem":"pypi","requirements":"==2.9.1","direct":true,"kind":"development","optional":false},{"id":7662291861,"package_name":"pydantic","ecosystem":"pypi","requirements":"==1.10.2","direct":true,"kind":"development","optional":false},{"id":7662291862,"package_name":"pyflakes","ecosystem":"pypi","requirements":"==2.5.0","direct":true,"kind":"development","optional":false},{"id":7662291863,"package_name":"pyparsing","ecosystem":"pypi","requirements":"==3.0.9","direct":true,"kind":"development","optional":false},{"id":7662291864,"package_name":"pytest","ecosystem":"pypi","requirements":"==6.2.4","direct":true,"kind":"development","optional":false},{"id":7662291865,"package_name":"python-dateutil","ecosystem":"pypi","requirements":"==2.8.2","direct":true,"kind":"development","optional":false},{"id":7662291866,"package_name":"pytz","ecosystem":"pypi","requirements":"==2022.5","direct":true,"kind":"development","optional":false},{"id":7662291867,"package_name":"pyyaml","ecosystem":"pypi","requirements":"==6.0","direct":true,"kind":"development","optional":false},{"id":7662291868,"package_name":"regex","ecosystem":"pypi","requirements":"==2022.9.13","direct":true,"kind":"development","optional":false},{"id":7662291869,"package_name":"requests","ecosystem":"pypi","requirements":"==2.28.1","direct":true,"kind":"development","optional":false},{"id":7662291870,"package_name":"responses","ecosystem":"pypi","requirements":"==0.18.0","direct":true,"kind":"development","optional":false},{"id":7662291871,"package_name":"scikit-learn","ecosystem":"pypi","requirements":"==1.0.2","direct":true,"kind":"development","optional":false},{"id":7662291872,"package_name":"scipy","ecosystem":"pypi","requirements":"==1.7.3","direct":true,"kind":"development","optional":false},{"id":7662291873,"package_name":"segtok","ecosystem":"pypi","requirements":"==1.5.11","direct":true,"kind":"development","optional":false},{"id":7662291874,"package_name":"sentencepiece","ecosystem":"pypi","requirements":"==0.1.97","direct":true,"kind":"development","optional":false},{"id":7662291875,"package_name":"sentry-sdk","ecosystem":"pypi","requirements":"==1.10.1","direct":true,"kind":"development","optional":false},{"id":7662291876,"package_name":"setproctitle","ecosystem":"pypi","requirements":"==1.3.2","direct":true,"kind":"development","optional":false},{"id":7662291877,"package_name":"setuptools-scm","ecosystem":"pypi","requirements":"==6.4.2","direct":true,"kind":"development","optional":false},{"id":7662291878,"package_name":"setuptools","ecosystem":"pypi","requirements":"==62.6.0","direct":true,"kind":"development","optional":false},{"id":7662291879,"package_name":"shortuuid","ecosystem":"pypi","requirements":"==1.0.9","direct":true,"kind":"development","optional":false},{"id":7662291880,"package_name":"six","ecosystem":"pypi","requirements":"==1.16.0","direct":true,"kind":"development","optional":false},{"id":7662291881,"package_name":"smart-open","ecosystem":"pypi","requirements":"==6.2.0","direct":true,"kind":"development","optional":false},{"id":7662291882,"package_name":"smmap","ecosystem":"pypi","requirements":"==5.0.0","direct":true,"kind":"development","optional":false},{"id":7662291883,"package_name":"sqlitedict","ecosystem":"pypi","requirements":"==2.0.0","direct":true,"kind":"development","optional":false},{"id":7662291884,"package_name":"tabulate","ecosystem":"pypi","requirements":"==0.9.0","direct":true,"kind":"development","optional":false},{"id":7662291885,"package_name":"threadpoolctl","ecosystem":"pypi","requirements":"==3.1.0","direct":true,"kind":"development","optional":false},{"id":7662291886,"package_name":"tokenizers","ecosystem":"pypi","requirements":"==0.13.1","direct":true,"kind":"development","optional":false},{"id":7662291887,"package_name":"toml","ecosystem":"pypi","requirements":"==0.10.2","direct":true,"kind":"development","optional":false},{"id":7662291888,"package_name":"tomli","ecosystem":"pypi","requirements":"==2.0.1","direct":true,"kind":"development","optional":false},{"id":7662291889,"package_name":"torch","ecosystem":"pypi","requirements":"==1.9.0","direct":true,"kind":"development","optional":false},{"id":7662291890,"package_name":"tqdm","ecosystem":"pypi","requirements":"==4.64.1","direct":true,"kind":"development","optional":false},{"id":7662291891,"package_name":"transformers","ecosystem":"pypi","requirements":"==4.23.1","direct":true,"kind":"development","optional":false},{"id":7662291892,"package_name":"typed-ast","ecosystem":"pypi","requirements":"==1.5.4","direct":true,"kind":"development","optional":false},{"id":7662291893,"package_name":"typing-extensions","ecosystem":"pypi","requirements":"==4.4.0","direct":true,"kind":"development","optional":false},{"id":7662291894,"package_name":"urllib3","ecosystem":"pypi","requirements":"==1.26.12","direct":true,"kind":"development","optional":false},{"id":7662291895,"package_name":"wandb","ecosystem":"pypi","requirements":"==0.13.4","direct":true,"kind":"development","optional":false},{"id":7662291896,"package_name":"wheel","ecosystem":"pypi","requirements":"==0.37.1","direct":true,"kind":"development","optional":false},{"id":7662291897,"package_name":"wikipedia2vec","ecosystem":"pypi","requirements":"==1.0.5","direct":true,"kind":"development","optional":false},{"id":7662291898,"package_name":"win32-setctime","ecosystem":"pypi","requirements":"==1.1.0","direct":true,"kind":"development","optional":false},{"id":7662291899,"package_name":"wrapt","ecosystem":"pypi","requirements":"==1.14.1","direct":true,"kind":"development","optional":false},{"id":7662291900,"package_name":"xxhash","ecosystem":"pypi","requirements":"==3.1.0","direct":true,"kind":"development","optional":false},{"id":7662291901,"package_name":"yarl","ecosystem":"pypi","requirements":"==1.8.1","direct":true,"kind":"development","optional":false},{"id":7662291902,"package_name":"zipp","ecosystem":"pypi","requirements":"==3.10.0","direct":true,"kind":"development","optional":false}]},{"ecosystem":"pypi","filepath":"pyproject.toml","sha":null,"kind":"manifest","created_at":"2024-11-11T03:12:57.253Z","updated_at":"2024-11-11T03:12:57.253Z","repository_link":"https://github.com/bigscience-workshop/metadata/blob/master/pyproject.toml","dependencies":[]},{"ecosystem":"pypi","filepath":"setup.py","sha":null,"kind":"manifest","created_at":"2024-11-11T03:12:57.341Z","updated_at":"2024-11-11T03:12:57.341Z","repository_link":"https://github.com/bigscience-workshop/metadata/blob/master/setup.py","dependencies":[]}],"score":null,"created_at":"2025-09-09T00:23:01.103Z","updated_at":"2025-10-07T08:36:45.076Z","avatar_url":"https://github.com/bigscience-workshop.png","language":"Python","category":null,"sub_category":null,"monthly_downloads":0,"funding_links":[],"readme_doi_urls":[],"works":{},"citation_counts":{},"total_citations":0,"keywords_from_contributors":[],"project_url":"https://science.ecosyste.ms/api/v1/projects/146795","html_url":"https://science.ecosyste.ms/projects/146795"}