{"id":55904,"name":"text-dedup","description":"All-in-one text de-duplication","url":"https://github.com/chenghaomou/text-dedup","last_synced_at":"2025-09-05T14:03:44.628Z","repository":{"id":37245633,"uuid":"347428086","full_name":"ChenghaoMou/text-dedup","owner":"ChenghaoMou","description":"All-in-one text de-duplication","archived":false,"fork":false,"pushed_at":"2025-07-26T08:55:25.000Z","size":6335,"stargazers_count":710,"open_issues_count":2,"forks_count":74,"subscribers_count":3,"default_branch":"main","last_synced_at":"2025-08-29T04:26:51.246Z","etag":null,"topics":["data-processing","de-duplication","nlp","text-processing"],"latest_commit_sha":null,"homepage":"","language":"Python","has_issues":true,"has_wiki":null,"has_pages":null,"mirror_url":null,"source_name":null,"license":"apache-2.0","status":null,"scm":"git","pull_requests_enabled":true,"icon_url":"https://github.com/ChenghaoMou.png","metadata":{"files":{"readme":"README.md","changelog":null,"contributing":null,"funding":null,"license":"LICENSE","code_of_conduct":null,"threat_model":null,"audit":null,"citation":"CITATION.bib","codeowners":null,"security":null,"support":null,"governance":null,"roadmap":null,"authors":null,"dei":null,"publiccode":null,"codemeta":null,"zenodo":null}},"created_at":"2021-03-13T17:00:44.000Z","updated_at":"2025-08-28T00:08:58.000Z","dependencies_parsed_at":"2023-10-13T13:26:13.863Z","dependency_job_id":"9404e748-a6f4-42d3-bd76-fcae5c5b8319","html_url":"https://github.com/ChenghaoMou/text-dedup","commit_stats":null,"previous_names":[],"tags_count":17,"template":false,"template_full_name":null,"purl":"pkg:github/ChenghaoMou/text-dedup","repository_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/ChenghaoMou%2Ftext-dedup","tags_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/ChenghaoMou%2Ftext-dedup/tags","releases_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/ChenghaoMou%2Ftext-dedup/releases","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/ChenghaoMou%2Ftext-dedup/manifests","owner_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners/ChenghaoMou","download_url":"https://codeload.github.com/ChenghaoMou/text-dedup/tar.gz/refs/heads/main","sbom_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/ChenghaoMou%2Ftext-dedup/sbom","scorecard":null,"host":{"name":"GitHub","url":"https://github.com","kind":"github","repositories_count":273768127,"owners_count":25164464,"icon_url":"https://github.com/github.png","version":null,"created_at":"2022-05-30T11:31:42.601Z","updated_at":"2022-07-04T15:15:14.044Z","status":"online","status_checked_at":"2025-09-05T02:00:09.113Z","response_time":402,"last_error":null,"robots_txt_status":"success","robots_txt_updated_at":"2025-07-24T06:49:26.215Z","robots_txt_url":"https://github.com/robots.txt","online":true,"can_crawl_api":true,"host_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub","repositories_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories","repository_names_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repository_names","owners_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners"}},"owner":null,"packages":[{"id":2944260,"name":"text-dedup","ecosystem":"pypi","description":null,"homepage":null,"licenses":"Apache 2.0","normalized_licenses":["Apache-2.0"],"repository_url":"https://github.com/chenghaomou/text-dedup","keywords_array":[],"namespace":null,"versions_count":24,"first_release_published_at":"2021-03-14T20:46:03.000Z","latest_release_published_at":"2024-04-17T20:14:00.000Z","latest_release_number":"0.4.0","last_synced_at":"2025-08-29T06:50:48.738Z","created_at":"2022-04-10T12:49:14.924Z","updated_at":"2025-08-29T06:58:46.152Z","registry_url":"https://pypi.org/project/text-dedup/","install_command":"pip install text-dedup --index-url https://pypi.org/simple","documentation_url":"https://text-dedup.readthedocs.io/","metadata":{"funding":null,"documentation":null,"classifiers":["License :: Other/Proprietary License","Programming Language :: Python :: 3","Programming Language :: Python :: 3.10","Programming Language :: Python :: 3.11","Programming Language :: Python :: 3.12"],"normalized_name":"text-dedup","project_status":null},"repo_metadata":{"id":37245633,"uuid":"347428086","full_name":"ChenghaoMou/text-dedup","owner":"ChenghaoMou","description":"All-in-one text de-duplication","archived":false,"fork":false,"pushed_at":"2025-07-26T08:55:25.000Z","size":6335,"stargazers_count":710,"open_issues_count":2,"forks_count":74,"subscribers_count":3,"default_branch":"main","last_synced_at":"2025-08-29T04:26:51.246Z","etag":null,"topics":["data-processing","de-duplication","nlp","text-processing"],"latest_commit_sha":null,"homepage":"","language":"Python","has_issues":true,"has_wiki":null,"has_pages":null,"mirror_url":null,"source_name":null,"license":"apache-2.0","status":null,"scm":"git","pull_requests_enabled":true,"icon_url":"https://github.com/ChenghaoMou.png","metadata":{"files":{"readme":"README.md","changelog":null,"contributing":null,"funding":null,"license":"LICENSE","code_of_conduct":null,"threat_model":null,"audit":null,"citation":"CITATION.bib","codeowners":null,"security":null,"support":null,"governance":null,"roadmap":null,"authors":null,"dei":null,"publiccode":null,"codemeta":null,"zenodo":null}},"created_at":"2021-03-13T17:00:44.000Z","updated_at":"2025-08-28T00:08:58.000Z","dependencies_parsed_at":"2023-10-13T13:26:13.863Z","dependency_job_id":"9404e748-a6f4-42d3-bd76-fcae5c5b8319","html_url":"https://github.com/ChenghaoMou/text-dedup","commit_stats":null,"previous_names":[],"tags_count":17,"template":false,"template_full_name":null,"purl":"pkg:github/ChenghaoMou/text-dedup","repository_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/ChenghaoMou%2Ftext-dedup","tags_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/ChenghaoMou%2Ftext-dedup/tags","releases_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/ChenghaoMou%2Ftext-dedup/releases","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/ChenghaoMou%2Ftext-dedup/manifests","owner_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners/ChenghaoMou","download_url":"https://codeload.github.com/ChenghaoMou/text-dedup/tar.gz/refs/heads/main","sbom_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/ChenghaoMou%2Ftext-dedup/sbom","scorecard":null,"host":{"name":"GitHub","url":"https://github.com","kind":"github","repositories_count":272646699,"owners_count":24969678,"icon_url":"https://github.com/github.png","version":null,"created_at":"2022-05-30T11:31:42.601Z","updated_at":"2022-07-04T15:15:14.044Z","status":"online","status_checked_at":"2025-08-29T02:00:10.610Z","response_time":87,"last_error":null,"robots_txt_status":"success","robots_txt_updated_at":"2025-07-24T06:49:26.215Z","robots_txt_url":"https://github.com/robots.txt","online":true,"can_crawl_api":true,"host_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub","repositories_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories","repository_names_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repository_names","owners_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners"},"owner_record":{"login":"ChenghaoMou","name":"Chenghao Mou","uuid":"32014649","kind":"user","description":"NLP/AI\r\n","email":"","website":"https://sleeplessindebugging.blog/","location":"Ireland","twitter":null,"company":null,"icon_url":"https://avatars.githubusercontent.com/u/32014649?u=bf7b28ce77de4c43a90023474dd208c971e8a872\u0026v=4","repositories_count":32,"last_synced_at":"2025-08-29T01:08:28.196Z","metadata":{"has_sponsors_listing":true},"html_url":"https://github.com/ChenghaoMou","funding_links":["https://github.com/sponsors/ChenghaoMou"],"total_stars":623,"followers":128,"following":252,"created_at":"2022-11-14T19:51:49.742Z","updated_at":"2025-08-29T01:08:28.196Z","owner_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners/ChenghaoMou","repositories_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners/ChenghaoMou/repositories"},"tags":[{"name":"0.4.0","sha":"34dff553b8a1d2fd3b784aed80ff76eb35b4c8cf","kind":"tag","published_at":"2024-04-17T20:12:44.000Z","download_url":"https://codeload.github.com/ChenghaoMou/text-dedup/tar.gz/0.4.0","html_url":"https://github.com/ChenghaoMou/text-dedup/releases/tag/0.4.0","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/ChenghaoMou/text-dedup@0.4.0","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/ChenghaoMou%2Ftext-dedup/tags/0.4.0","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/ChenghaoMou%2Ftext-dedup/tags/0.4.0/manifests"},{"name":"2023.09.20","sha":"f565d158a38835f337b478db38e706b7fb235600","kind":"tag","published_at":"2023-09-20T21:18:02.000Z","download_url":"https://codeload.github.com/ChenghaoMou/text-dedup/tar.gz/2023.09.20","html_url":"https://github.com/ChenghaoMou/text-dedup/releases/tag/2023.09.20","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/ChenghaoMou/text-dedup@2023.09.20","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/ChenghaoMou%2Ftext-dedup/tags/2023.09.20","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/ChenghaoMou%2Ftext-dedup/tags/2023.09.20/manifests"},{"name":"0.3.1","sha":"926d56a01d678162af4bb93f51ee4d00f7a04aa3","kind":"tag","published_at":"2023-03-25T20:01:39.000Z","download_url":"https://codeload.github.com/ChenghaoMou/text-dedup/tar.gz/0.3.1","html_url":"https://github.com/ChenghaoMou/text-dedup/releases/tag/0.3.1","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/ChenghaoMou/text-dedup@0.3.1","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/ChenghaoMou%2Ftext-dedup/tags/0.3.1","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/ChenghaoMou%2Ftext-dedup/tags/0.3.1/manifests"},{"name":"0.3.0","sha":"8ef91c6904ed90cb084582ecc6c8b0656df2d3f9","kind":"tag","published_at":"2022-11-05T23:01:16.000Z","download_url":"https://codeload.github.com/ChenghaoMou/text-dedup/tar.gz/0.3.0","html_url":"https://github.com/ChenghaoMou/text-dedup/releases/tag/0.3.0","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/ChenghaoMou/text-dedup@0.3.0","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/ChenghaoMou%2Ftext-dedup/tags/0.3.0","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/ChenghaoMou%2Ftext-dedup/tags/0.3.0/manifests"},{"name":"0.2.1","sha":"a43d73958dac17de8ef5587b407edeb7ba81080d","kind":"tag","published_at":"2022-09-29T01:38:15.000Z","download_url":"https://codeload.github.com/ChenghaoMou/text-dedup/tar.gz/0.2.1","html_url":"https://github.com/ChenghaoMou/text-dedup/releases/tag/0.2.1","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/ChenghaoMou/text-dedup@0.2.1","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/ChenghaoMou%2Ftext-dedup/tags/0.2.1","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/ChenghaoMou%2Ftext-dedup/tags/0.2.1/manifests"},{"name":"0.2.0","sha":"49efc3363023d25431d690c41a07dc7ec91e3f3b","kind":"tag","published_at":"2022-09-24T03:54:17.000Z","download_url":"https://codeload.github.com/ChenghaoMou/text-dedup/tar.gz/0.2.0","html_url":"https://github.com/ChenghaoMou/text-dedup/releases/tag/0.2.0","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/ChenghaoMou/text-dedup@0.2.0","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/ChenghaoMou%2Ftext-dedup/tags/0.2.0","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/ChenghaoMou%2Ftext-dedup/tags/0.2.0/manifests"},{"name":"0.1.1","sha":"4a49424e6fe5ba50d8288406330aef97139eb0e0","kind":"tag","published_at":"2022-09-04T17:56:21.000Z","download_url":"https://codeload.github.com/ChenghaoMou/text-dedup/tar.gz/0.1.1","html_url":"https://github.com/ChenghaoMou/text-dedup/releases/tag/0.1.1","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/ChenghaoMou/text-dedup@0.1.1","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/ChenghaoMou%2Ftext-dedup/tags/0.1.1","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/ChenghaoMou%2Ftext-dedup/tags/0.1.1/manifests"},{"name":"0.1.0","sha":"682dd1d611e1085eadb1cac290691e1b6c3fc94f","kind":"tag","published_at":"2022-08-27T20:13:24.000Z","download_url":"https://codeload.github.com/ChenghaoMou/text-dedup/tar.gz/0.1.0","html_url":"https://github.com/ChenghaoMou/text-dedup/releases/tag/0.1.0","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/ChenghaoMou/text-dedup@0.1.0","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/ChenghaoMou%2Ftext-dedup/tags/0.1.0","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/ChenghaoMou%2Ftext-dedup/tags/0.1.0/manifests"},{"name":"0.0.18","sha":"536e9102df2a1acc8c355ac709b579406952c4e5","kind":"tag","published_at":"2022-06-20T21:40:53.000Z","download_url":"https://codeload.github.com/ChenghaoMou/text-dedup/tar.gz/0.0.18","html_url":"https://github.com/ChenghaoMou/text-dedup/releases/tag/0.0.18","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/ChenghaoMou/text-dedup@0.0.18","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/ChenghaoMou%2Ftext-dedup/tags/0.0.18","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/ChenghaoMou%2Ftext-dedup/tags/0.0.18/manifests"},{"name":"0.0.17","sha":"94c6df28eec9243277cbc98ed1fb177efcd15f90","kind":"tag","published_at":"2022-06-15T03:04:49.000Z","download_url":"https://codeload.github.com/ChenghaoMou/text-dedup/tar.gz/0.0.17","html_url":"https://github.com/ChenghaoMou/text-dedup/releases/tag/0.0.17","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/ChenghaoMou/text-dedup@0.0.17","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/ChenghaoMou%2Ftext-dedup/tags/0.0.17","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/ChenghaoMou%2Ftext-dedup/tags/0.0.17/manifests"},{"name":"0.0.16","sha":"c585de4f57a7232012b8083cdb726b8409ed07af","kind":"tag","published_at":"2022-06-14T03:17:02.000Z","download_url":"https://codeload.github.com/ChenghaoMou/text-dedup/tar.gz/0.0.16","html_url":"https://github.com/ChenghaoMou/text-dedup/releases/tag/0.0.16","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/ChenghaoMou/text-dedup@0.0.16","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/ChenghaoMou%2Ftext-dedup/tags/0.0.16","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/ChenghaoMou%2Ftext-dedup/tags/0.0.16/manifests"},{"name":"0.0.15","sha":"8c2242e85a7be32b0998a3e1becd69a35940a2ce","kind":"tag","published_at":"2022-05-29T20:41:40.000Z","download_url":"https://codeload.github.com/ChenghaoMou/text-dedup/tar.gz/0.0.15","html_url":"https://github.com/ChenghaoMou/text-dedup/releases/tag/0.0.15","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/ChenghaoMou/text-dedup@0.0.15","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/ChenghaoMou%2Ftext-dedup/tags/0.0.15","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/ChenghaoMou%2Ftext-dedup/tags/0.0.15/manifests"},{"name":"0.0.14","sha":"8c2242e85a7be32b0998a3e1becd69a35940a2ce","kind":"tag","published_at":"2022-05-29T02:05:28.000Z","download_url":"https://codeload.github.com/ChenghaoMou/text-dedup/tar.gz/0.0.14","html_url":"https://github.com/ChenghaoMou/text-dedup/releases/tag/0.0.14","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/ChenghaoMou/text-dedup@0.0.14","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/ChenghaoMou%2Ftext-dedup/tags/0.0.14","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/ChenghaoMou%2Ftext-dedup/tags/0.0.14/manifests"},{"name":"list","sha":"8c2242e85a7be32b0998a3e1becd69a35940a2ce","kind":"commit","published_at":"2022-05-29T02:03:53.000Z","download_url":"https://codeload.github.com/ChenghaoMou/text-dedup/tar.gz/list","html_url":"https://github.com/ChenghaoMou/text-dedup/releases/tag/list","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/ChenghaoMou/text-dedup@list","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/ChenghaoMou%2Ftext-dedup/tags/list","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/ChenghaoMou%2Ftext-dedup/tags/list/manifests"},{"name":"0.0.13","sha":"24aa9b26a31b5ed39909c2fe09d7fda24b4729e7","kind":"tag","published_at":"2022-04-02T20:56:43.000Z","download_url":"https://codeload.github.com/ChenghaoMou/text-dedup/tar.gz/0.0.13","html_url":"https://github.com/ChenghaoMou/text-dedup/releases/tag/0.0.13","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/ChenghaoMou/text-dedup@0.0.13","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/ChenghaoMou%2Ftext-dedup/tags/0.0.13","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/ChenghaoMou%2Ftext-dedup/tags/0.0.13/manifests"},{"name":"0.0.11","sha":"feede7e03ab979465ef1ef040a886c7dff401d69","kind":"tag","published_at":"2021-07-24T18:52:55.000Z","download_url":"https://codeload.github.com/ChenghaoMou/text-dedup/tar.gz/0.0.11","html_url":"https://github.com/ChenghaoMou/text-dedup/releases/tag/0.0.11","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/ChenghaoMou/text-dedup@0.0.11","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/ChenghaoMou%2Ftext-dedup/tags/0.0.11","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/ChenghaoMou%2Ftext-dedup/tags/0.0.11/manifests"},{"name":"0.0.10","sha":"b13b5f6c2c5fb2115bf222973a0d0bdf5193b975","kind":"tag","published_at":"2021-07-24T18:13:31.000Z","download_url":"https://codeload.github.com/ChenghaoMou/text-dedup/tar.gz/0.0.10","html_url":"https://github.com/ChenghaoMou/text-dedup/releases/tag/0.0.10","dependencies_parsed_at":null,"dependency_job_id":null,"purl":"pkg:github/ChenghaoMou/text-dedup@0.0.10","tag_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/ChenghaoMou%2Ftext-dedup/tags/0.0.10","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/ChenghaoMou%2Ftext-dedup/tags/0.0.10/manifests"}]},"repo_metadata_updated_at":"2025-08-29T06:58:46.151Z","dependent_packages_count":0,"downloads":449,"downloads_period":"last-month","dependent_repos_count":2,"rankings":{"downloads":19.930200982923143,"dependent_repos_count":11.583370469328855,"dependent_packages_count":10.038423948696664,"stargazers_count":null,"forks_count":null,"docker_downloads_count":null,"average":13.850665133649555},"purl":"pkg:pypi/text-dedup","advisories":[],"docker_usage_url":"https://docker.ecosyste.ms/usage/pypi/text-dedup","docker_dependents_count":null,"docker_downloads_count":null,"usage_url":"https://repos.ecosyste.ms/usage/pypi/text-dedup","dependent_repositories_url":"https://repos.ecosyste.ms/api/v1/usage/pypi/text-dedup/dependencies","status":null,"funding_links":["https://github.com/sponsors/ChenghaoMou"],"critical":null,"issue_metadata":{"last_synced_at":"2024-02-27T03:18:11.154Z","issues_count":5,"pull_requests_count":21,"avg_time_to_close_issue":53619.75,"avg_time_to_close_pull_request":91285.15,"issues_closed_count":4,"pull_requests_closed_count":20,"pull_request_authors_count":2,"issue_authors_count":4,"avg_comments_per_issue":3.2,"avg_comments_per_pull_request":0.19047619047619047,"merged_pull_requests_count":18,"bot_issues_count":0,"bot_pull_requests_count":0,"past_year_issues_count":3,"past_year_pull_requests_count":5,"past_year_avg_time_to_close_issue":32627.333333333332,"past_year_avg_time_to_close_pull_request":71.0,"past_year_issues_closed_count":3,"past_year_pull_requests_closed_count":4,"past_year_pull_request_authors_count":2,"past_year_issue_authors_count":2,"past_year_avg_comments_per_issue":3.6666666666666665,"past_year_avg_comments_per_pull_request":0.6,"past_year_bot_issues_count":0,"past_year_bot_pull_requests_count":0,"past_year_merged_pull_requests_count":4,"issues_url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/repositories/serega%2Fgaoya/issues","maintainers":[{"login":"serega","count":21,"url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/authors/serega"}],"active_maintainers":[{"login":"serega","count":5,"url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/authors/serega"}]},"versions_url":"https://packages.ecosyste.ms/api/v1/registries/pypi.org/packages/text-dedup/versions","version_numbers_url":"https://packages.ecosyste.ms/api/v1/registries/pypi.org/packages/text-dedup/version_numbers","dependent_packages_url":"https://packages.ecosyste.ms/api/v1/registries/pypi.org/packages/text-dedup/dependent_packages","related_packages_url":"https://packages.ecosyste.ms/api/v1/registries/pypi.org/packages/text-dedup/related_packages","maintainers":[{"uuid":"Maxen1996","login":"Maxen1996","name":null,"email":null,"url":null,"packages_count":14,"html_url":"https://pypi.org/user/Maxen1996/","role":null,"created_at":"2022-12-01T06:16:37.449Z","updated_at":"2022-12-01T06:16:37.449Z","packages_url":"https://packages.ecosyste.ms/api/v1/registries/pypi.org/maintainers/Maxen1996/packages"}],"registry":{"name":"pypi.org","url":"https://pypi.org","ecosystem":"pypi","default":true,"packages_count":725158,"maintainers_count":308368,"namespaces_count":0,"keywords_count":238006,"github":"pypi","metadata":{"funded_packages_count":50519},"icon_url":"https://github.com/pypi.png","created_at":"2022-04-04T15:19:23.364Z","updated_at":"2025-09-05T05:40:58.860Z","packages_url":"https://packages.ecosyste.ms/api/v1/registries/pypi.org/packages","maintainers_url":"https://packages.ecosyste.ms/api/v1/registries/pypi.org/maintainers","namespaces_url":"https://packages.ecosyste.ms/api/v1/registries/pypi.org/namespaces"}}],"commits":{"id":5818511,"full_name":"chenghaomou/text-dedup","default_branch":"master","committers":null,"total_commits":null,"total_committers":null,"total_bot_commits":null,"total_bot_committers":null,"mean_commits":null,"dds":null,"past_year_committers":null,"past_year_total_commits":null,"past_year_total_committers":null,"past_year_total_bot_commits":null,"past_year_total_bot_committers":null,"past_year_mean_commits":null,"past_year_dds":null,"last_synced_at":null,"last_synced_commit":null,"created_at":"2024-11-15T09:51:08.554Z","updated_at":"2024-11-15T09:51:08.554Z","commits_url":"https://commits.ecosyste.ms/api/v1/hosts/GitHub/repositories/chenghaomou%2Ftext-dedup/commits","host":{"name":"GitHub","url":"https://github.com","kind":"github","last_synced_at":"2025-09-05T00:00:10.343Z","repositories_count":5480019,"commits_count":853389012,"contributors_count":31098138,"owners_count":906558,"icon_url":"https://github.com/github.png","host_url":"https://commits.ecosyste.ms/api/v1/hosts/GitHub","repositories_url":"https://commits.ecosyste.ms/api/v1/hosts/GitHub/repositories"}},"issues_stats":{"full_name":"ChenghaoMou/text-dedup","html_url":"https://github.com/ChenghaoMou/text-dedup","last_synced_at":"2025-08-31T13:06:20.479Z","status":null,"issues_count":16,"pull_requests_count":4,"avg_time_to_close_issue":796129.7333333333,"avg_time_to_close_pull_request":2952765.0,"issues_closed_count":15,"pull_requests_closed_count":2,"pull_request_authors_count":2,"issue_authors_count":4,"avg_comments_per_issue":0.5625,"avg_comments_per_pull_request":0.5,"merged_pull_requests_count":1,"bot_issues_count":12,"bot_pull_requests_count":0,"past_year_issues_count":16,"past_year_pull_requests_count":4,"past_year_avg_time_to_close_issue":796129.7333333333,"past_year_avg_time_to_close_pull_request":2952765.0,"past_year_issues_closed_count":15,"past_year_pull_requests_closed_count":2,"past_year_pull_request_authors_count":2,"past_year_issue_authors_count":4,"past_year_avg_comments_per_issue":0.5625,"past_year_avg_comments_per_pull_request":0.5,"past_year_bot_issues_count":12,"past_year_bot_pull_requests_count":0,"past_year_merged_pull_requests_count":1,"created_at":"2025-08-29T11:56:24.322Z","updated_at":"2025-09-03T05:19:57.216Z","repository_url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/repositories/ChenghaoMou%2Ftext-dedup","issues_url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/repositories/ChenghaoMou%2Ftext-dedup/issues","issue_labels_count":{"no-issue-activity":22},"pull_request_labels_count":{"no-issue-activity":2,"dependencies":1,"no-pr-activity":1},"issue_author_associations_count":{"NONE":44,"OWNER":1},"pull_request_author_associations_count":{"OWNER":4,"NONE":4,"CONTRIBUTOR":3},"issue_authors":{"linear[bot]":17,"Dodero10":3,"mmpouya":2,"Jason3900":2,"bowspider-man":2,"alielfilali01":1,"hancheolcho":1,"MiladMolazadeh":1,"maoxiangyi":1,"311dada":1,"cjmp1":1,"wuodar":1,"simplew2011":1,"XChen-Zero":1,"siebeniris":1,"mohamedlekarim":1,"kimcando":1,"varuy322":1,"Leoooooo123":1,"programmerLY":1,"ChenghaoMou":1,"HungHoangDinh":1,"Yang-QW":1,"prikmm":1},"pull_request_authors":{"ChenghaoMou":4,"louisowen6":2,"qxuanson":1,"chris-ha458":1,"mohamedlekarim":1,"dependabot[bot]":1,"hahmad2008":1},"host":{"name":"GitHub","url":"https://github.com","kind":"github","last_synced_at":"2025-09-05T00:00:10.444Z","repositories_count":10098650,"issues_count":31447165,"pull_requests_count":97330651,"authors_count":10702032,"icon_url":"https://github.com/github.png","host_url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub","repositories_url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/repositories","owners_url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/owners","authors_url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/authors"},"past_year_issue_labels_count":{"no-issue-activity":2},"past_year_pull_request_labels_count":{"no-issue-activity":1},"past_year_issue_author_associations_count":{"NONE":19},"past_year_pull_request_author_associations_count":{"OWNER":3,"NONE":2},"past_year_issue_authors":{"linear[bot]":12,"bowspider-man":2,"mmpouya":2,"mohamedlekarim":1,"varuy322":1,"XChen-Zero":1},"past_year_pull_request_authors":{"ChenghaoMou":3,"qxuanson":1,"mohamedlekarim":1},"maintainers":[{"login":"ChenghaoMou","count":5,"url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/authors/ChenghaoMou"}],"active_maintainers":[{"login":"ChenghaoMou","count":3,"url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/authors/ChenghaoMou"}]},"events":{"total":{"IssuesEvent":45,"WatchEvent":104,"IssueCommentEvent":17,"PushEvent":5,"PullRequestEvent":4,"ForkEvent":5,"CreateEvent":3},"last_year":{"IssuesEvent":45,"WatchEvent":104,"IssueCommentEvent":17,"PushEvent":5,"PullRequestEvent":4,"ForkEvent":5,"CreateEvent":3}},"keywords":["data-processing","de-duplication","nlp","text-processing"],"dependencies":null,"score":null,"created_at":"2025-09-04T15:51:31.997Z","updated_at":"2025-10-07T08:22:06.540Z","avatar_url":"https://github.com/ChenghaoMou.png","language":"Python","category":null,"sub_category":null,"monthly_downloads":449,"funding_links":[],"readme_doi_urls":["https://doi.org/10.5281/zenodo.8364980"],"works":{},"citation_counts":{},"total_citations":0,"keywords_from_contributors":[],"project_url":"https://science.ecosyste.ms/api/v1/projects/55904","html_url":"https://science.ecosyste.ms/projects/55904","bibtex_url":"https://science.ecosyste.ms/projects/55904/export.bibtex","apalike_url":"https://science.ecosyste.ms/projects/55904/export.apalike"}