{"id":182944,"name":null,"description":"Cleaning tool for web scraped text","url":"https://github.com/citiususc/pyplexity","last_synced_at":"2025-09-10T01:35:03.292Z","repository":{"id":43462948,"uuid":"462290971","full_name":"citiususc/pyplexity","owner":"citiususc","description":"Cleaning tool for web scraped text","archived":false,"fork":false,"pushed_at":"2023-06-07T09:59:20.000Z","size":269,"stargazers_count":38,"open_issues_count":2,"forks_count":3,"subscribers_count":3,"default_branch":"main","last_synced_at":"2025-07-26T11:38:39.844Z","etag":null,"topics":["information-retrieval","nlp","python","scraping","tag-cleaning"],"latest_commit_sha":null,"homepage":"","language":"Python","has_issues":true,"has_wiki":null,"has_pages":null,"mirror_url":null,"source_name":null,"license":"gpl-3.0","status":null,"scm":"git","pull_requests_enabled":true,"icon_url":"https://github.com/citiususc.png","metadata":{"files":{"readme":"README.md","changelog":null,"contributing":null,"funding":null,"license":"LICENSE","code_of_conduct":null,"threat_model":null,"audit":null,"citation":null,"codeowners":null,"security":null,"support":null,"governance":null,"roadmap":null,"authors":null,"dei":null,"publiccode":null,"codemeta":null}},"created_at":"2022-02-22T12:37:09.000Z","updated_at":"2025-05-10T06:54:51.000Z","dependencies_parsed_at":"2024-12-02T02:49:44.063Z","dependency_job_id":null,"html_url":"https://github.com/citiususc/pyplexity","commit_stats":{"total_commits":25,"total_committers":6,"mean_commits":4.166666666666667,"dds":0.6799999999999999,"last_synced_commit":"5348adda1006ff5f2c6bd740afacb9aaaad006fd"},"previous_names":[],"tags_count":0,"template":false,"template_full_name":null,"purl":"pkg:github/citiususc/pyplexity","repository_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/citiususc%2Fpyplexity","tags_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/citiususc%2Fpyplexity/tags","releases_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/citiususc%2Fpyplexity/releases","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/citiususc%2Fpyplexity/manifests","owner_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners/citiususc","download_url":"https://codeload.github.com/citiususc/pyplexity/tar.gz/refs/heads/main","sbom_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/citiususc%2Fpyplexity/sbom","scorecard":{"id":283535,"data":{"date":"2025-08-11","repo":{"name":"github.com/citiususc/pyplexity","commit":"7d3ebd5a84b835ec513874494fd4e91393b35ab9"},"scorecard":{"version":"v5.2.1-40-gf6ed084d","commit":"f6ed084d17c9236477efd66e5b258b9d4cc7b389"},"score":2.1,"checks":[{"name":"Code-Review","score":0,"reason":"Found 0/27 approved changesets -- score normalized to 0","details":null,"documentation":{"short":"Determines if the project requires human code review before pull requests (aka merge requests) are merged.","url":"https://github.com/ossf/scorecard/blob/f6ed084d17c9236477efd66e5b258b9d4cc7b389/docs/checks.md#code-review"}},{"name":"Packaging","score":-1,"reason":"packaging workflow not detected","details":["Warn: no GitHub/GitLab publishing workflow detected."],"documentation":{"short":"Determines if the project is published as a package that others can easily download, install, easily update, and uninstall.","url":"https://github.com/ossf/scorecard/blob/f6ed084d17c9236477efd66e5b258b9d4cc7b389/docs/checks.md#packaging"}},{"name":"Dangerous-Workflow","score":-1,"reason":"no workflows found","details":null,"documentation":{"short":"Determines if the project's GitHub Action workflows avoid dangerous patterns.","url":"https://github.com/ossf/scorecard/blob/f6ed084d17c9236477efd66e5b258b9d4cc7b389/docs/checks.md#dangerous-workflow"}},{"name":"Token-Permissions","score":-1,"reason":"No tokens found","details":null,"documentation":{"short":"Determines if the project's workflows follow the principle of least privilege.","url":"https://github.com/ossf/scorecard/blob/f6ed084d17c9236477efd66e5b258b9d4cc7b389/docs/checks.md#token-permissions"}},{"name":"CII-Best-Practices","score":0,"reason":"no effort to earn an OpenSSF best practices badge detected","details":null,"documentation":{"short":"Determines if the project has an OpenSSF (formerly CII) Best Practices Badge.","url":"https://github.com/ossf/scorecard/blob/f6ed084d17c9236477efd66e5b258b9d4cc7b389/docs/checks.md#cii-best-practices"}},{"name":"Pinned-Dependencies","score":-1,"reason":"no dependencies found","details":null,"documentation":{"short":"Determines if the project has declared and pinned the dependencies of its build process.","url":"https://github.com/ossf/scorecard/blob/f6ed084d17c9236477efd66e5b258b9d4cc7b389/docs/checks.md#pinned-dependencies"}},{"name":"Maintained","score":0,"reason":"0 commit(s) and 0 issue activity found in the last 90 days -- score normalized to 0","details":null,"documentation":{"short":"Determines if the project is \"actively maintained\".","url":"https://github.com/ossf/scorecard/blob/f6ed084d17c9236477efd66e5b258b9d4cc7b389/docs/checks.md#maintained"}},{"name":"Vulnerabilities","score":10,"reason":"0 existing vulnerabilities detected","details":null,"documentation":{"short":"Determines if the project has open, known unfixed vulnerabilities.","url":"https://github.com/ossf/scorecard/blob/f6ed084d17c9236477efd66e5b258b9d4cc7b389/docs/checks.md#vulnerabilities"}},{"name":"Security-Policy","score":0,"reason":"security policy file not detected","details":["Warn: no security policy file detected","Warn: no security file to analyze","Warn: no security file to analyze","Warn: no security file to analyze"],"documentation":{"short":"Determines if the project has published a security policy.","url":"https://github.com/ossf/scorecard/blob/f6ed084d17c9236477efd66e5b258b9d4cc7b389/docs/checks.md#security-policy"}},{"name":"Fuzzing","score":0,"reason":"project is not fuzzed","details":["Warn: no fuzzer integrations found"],"documentation":{"short":"Determines if the project uses fuzzing.","url":"https://github.com/ossf/scorecard/blob/f6ed084d17c9236477efd66e5b258b9d4cc7b389/docs/checks.md#fuzzing"}},{"name":"Signed-Releases","score":-1,"reason":"no releases found","details":null,"documentation":{"short":"Determines if the project cryptographically signs release artifacts.","url":"https://github.com/ossf/scorecard/blob/f6ed084d17c9236477efd66e5b258b9d4cc7b389/docs/checks.md#signed-releases"}},{"name":"Binary-Artifacts","score":3,"reason":"binaries present in source code","details":["Warn: binary detected: pyplexity/__pycache__/__init__.cpython-39.pyc:1","Warn: binary detected: pyplexity/__pycache__/__main__.cpython-39.pyc:1","Warn: binary detected: pyplexity/__pycache__/distributed_files_server.cpython-39.pyc:1","Warn: binary detected: pyplexity/__pycache__/perpl_model.cpython-39.pyc:1","Warn: binary detected: pyplexity/__pycache__/tag_remover.cpython-39.pyc:1","Warn: binary detected: pyplexity/dataset_processor/__pycache__/CustomWARCWriter.cpython-39.pyc:1","Warn: binary detected: pyplexity/dataset_processor/__pycache__/dataset_processor.cpython-39.pyc:1"],"documentation":{"short":"Determines if the project has generated executable (binary) artifacts in the source repository.","url":"https://github.com/ossf/scorecard/blob/f6ed084d17c9236477efd66e5b258b9d4cc7b389/docs/checks.md#binary-artifacts"}},{"name":"License","score":10,"reason":"license file detected","details":["Info: project has a license file: LICENSE:0","Info: FSF or OSI recognized license: GNU General Public License v3.0: LICENSE:0"],"documentation":{"short":"Determines if the project has defined a license.","url":"https://github.com/ossf/scorecard/blob/f6ed084d17c9236477efd66e5b258b9d4cc7b389/docs/checks.md#license"}},{"name":"Branch-Protection","score":0,"reason":"branch protection not enabled on development/release branches","details":["Warn: branch protection not enabled for branch 'main'"],"documentation":{"short":"Determines if the default and release branches are protected with GitHub's branch protection settings.","url":"https://github.com/ossf/scorecard/blob/f6ed084d17c9236477efd66e5b258b9d4cc7b389/docs/checks.md#branch-protection"}},{"name":"SAST","score":0,"reason":"SAST tool is not run on all commits -- score normalized to 0","details":["Warn: 0 commits out of 4 are checked with a SAST tool"],"documentation":{"short":"Determines if the project uses static code analysis.","url":"https://github.com/ossf/scorecard/blob/f6ed084d17c9236477efd66e5b258b9d4cc7b389/docs/checks.md#sast"}}]},"last_synced_at":"2025-08-17T16:36:04.692Z","repository_id":43462948,"created_at":"2025-08-17T16:36:04.693Z","updated_at":"2025-08-17T16:36:04.693Z"},"host":{"name":"GitHub","url":"https://github.com","kind":"github","repositories_count":274396494,"owners_count":25277393,"icon_url":"https://github.com/github.png","version":null,"created_at":"2022-05-30T11:31:42.601Z","updated_at":"2022-07-04T15:15:14.044Z","status":"online","status_checked_at":"2025-09-09T02:00:10.223Z","response_time":80,"last_error":null,"robots_txt_status":"success","robots_txt_updated_at":"2025-07-24T06:49:26.215Z","robots_txt_url":"https://github.com/robots.txt","online":true,"can_crawl_api":true,"host_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub","repositories_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories","repository_names_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repository_names","owners_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners"}},"owner":{"login":"citiususc","name":"CiTIUS","uuid":"5822373","kind":"organization","description":"Centro Singular de Investigación en Tecnoloxías Intelixenteas da Universidade de Santiago de Compostela","email":"citius@usc.es","website":"https://citius.gal","location":"Santiago de Compostela","twitter":"citiususc","company":null,"icon_url":"https://avatars.githubusercontent.com/u/5822373?v=4","repositories_count":49,"last_synced_at":"2024-04-16T09:45:39.099Z","metadata":{"has_sponsors_listing":false},"html_url":"https://github.com/citiususc","funding_links":[],"total_stars":1317,"followers":20,"following":0,"created_at":"2022-11-05T04:52:06.925Z","updated_at":"2024-04-16T09:45:52.727Z","owner_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners/citiususc","repositories_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners/citiususc/repositories"},"packages":[{"id":2879722,"name":"pyplexity","ecosystem":"pypi","description":"Perplexity filter for documents and bulk HTML and WARC boilerplate removal.","homepage":"https://github.com/citiususc/pyplexity","licenses":"GPL-3.0-only","normalized_licenses":["GPL-3.0-only"],"repository_url":"https://github.com/citiususc/pyplexity","keywords_array":[],"namespace":null,"versions_count":18,"first_release_published_at":"2022-02-28T12:26:01.000Z","latest_release_published_at":"2023-06-07T09:18:39.000Z","latest_release_number":"0.2.12","last_synced_at":"2025-08-13T18:48:26.137Z","created_at":"2022-04-10T12:16:56.699Z","updated_at":"2025-08-13T18:48:26.137Z","registry_url":"https://pypi.org/project/pyplexity/","install_command":"pip install pyplexity --index-url https://pypi.org/simple","documentation_url":"https://pyplexity.readthedocs.io/","metadata":{"funding":null,"documentation":null,"classifiers":["License :: OSI Approved :: GNU General Public License v3 (GPLv3)","Programming Language :: Python :: 3","Programming Language :: Python :: 3.10","Programming Language :: Python :: 3.11","Programming Language :: Python :: 3.7","Programming Language :: Python :: 3.8","Programming Language :: Python :: 3.9"],"normalized_name":"pyplexity"},"repo_metadata":{"id":43462948,"uuid":"462290971","full_name":"citiususc/pyplexity","owner":"citiususc","description":"Cleaning tool for web scraped text","archived":false,"fork":false,"pushed_at":"2023-06-07T09:59:20.000Z","size":269,"stargazers_count":38,"open_issues_count":2,"forks_count":3,"subscribers_count":3,"default_branch":"main","last_synced_at":"2025-05-14T23:31:56.823Z","etag":null,"topics":["information-retrieval","nlp","python","scraping","tag-cleaning"],"latest_commit_sha":null,"homepage":"","language":"Python","has_issues":true,"has_wiki":null,"has_pages":null,"mirror_url":null,"source_name":null,"license":"gpl-3.0","status":null,"scm":"git","pull_requests_enabled":true,"icon_url":"https://github.com/citiususc.png","metadata":{"files":{"readme":"README.md","changelog":null,"contributing":null,"funding":null,"license":"LICENSE","code_of_conduct":null,"threat_model":null,"audit":null,"citation":null,"codeowners":null,"security":null,"support":null,"governance":null,"roadmap":null,"authors":null,"dei":null,"publiccode":null,"codemeta":null}},"created_at":"2022-02-22T12:37:09.000Z","updated_at":"2025-05-10T06:54:51.000Z","dependencies_parsed_at":"2024-12-02T02:49:44.063Z","dependency_job_id":null,"html_url":"https://github.com/citiususc/pyplexity","commit_stats":{"total_commits":25,"total_committers":6,"mean_commits":4.166666666666667,"dds":0.6799999999999999,"last_synced_commit":"5348adda1006ff5f2c6bd740afacb9aaaad006fd"},"previous_names":[],"tags_count":0,"template":false,"template_full_name":null,"purl":"pkg:github/citiususc/pyplexity","repository_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/citiususc%2Fpyplexity","tags_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/citiususc%2Fpyplexity/tags","releases_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/citiususc%2Fpyplexity/releases","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/citiususc%2Fpyplexity/manifests","owner_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners/citiususc","download_url":"https://codeload.github.com/citiususc/pyplexity/tar.gz/refs/heads/main","sbom_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/citiususc%2Fpyplexity/sbom","host":{"name":"GitHub","url":"https://github.com","kind":"github","repositories_count":262708058,"owners_count":23351536,"icon_url":"https://github.com/github.png","version":null,"created_at":"2022-05-30T11:31:42.601Z","updated_at":"2022-07-04T15:15:14.044Z","host_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub","repositories_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories","repository_names_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repository_names","owners_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners"},"owner_record":{"login":"citiususc","name":"CiTIUS","uuid":"5822373","kind":"organization","description":"Centro Singular de Investigación en Tecnoloxías Intelixenteas da Universidade de Santiago de Compostela","email":"citius@usc.es","website":"https://citius.gal","location":"Santiago de Compostela","twitter":"citiususc","company":null,"icon_url":"https://avatars.githubusercontent.com/u/5822373?v=4","repositories_count":49,"last_synced_at":"2024-04-16T09:45:39.099Z","metadata":{"has_sponsors_listing":false},"html_url":"https://github.com/citiususc","funding_links":[],"total_stars":1317,"followers":20,"following":0,"created_at":"2022-11-05T04:52:06.925Z","updated_at":"2024-04-16T09:45:52.727Z","owner_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners/citiususc","repositories_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners/citiususc/repositories"},"tags":[]},"repo_metadata_updated_at":"2025-06-30T04:15:30.013Z","dependent_packages_count":0,"downloads":81196,"downloads_period":"last-month","dependent_repos_count":1,"rankings":{"downloads":16.208278679381003,"dependent_repos_count":21.778912670755105,"dependent_packages_count":9.966767819241568,"stargazers_count":11.146450856908665,"forks_count":22.654826388554824,"docker_downloads_count":null,"average":16.35104728296823},"purl":"pkg:pypi/pyplexity","advisories":[],"docker_usage_url":"https://docker.ecosyste.ms/usage/pypi/pyplexity","docker_dependents_count":null,"docker_downloads_count":null,"usage_url":"https://repos.ecosyste.ms/usage/pypi/pyplexity","dependent_repositories_url":"https://repos.ecosyste.ms/api/v1/usage/pypi/pyplexity/dependencies","status":null,"funding_links":[],"critical":null,"issue_metadata":{"last_synced_at":"2025-05-14T23:26:28.654Z","issues_count":2,"pull_requests_count":2,"avg_time_to_close_issue":null,"avg_time_to_close_pull_request":75.0,"issues_closed_count":0,"pull_requests_closed_count":2,"pull_request_authors_count":2,"issue_authors_count":2,"avg_comments_per_issue":0.0,"avg_comments_per_pull_request":0.0,"merged_pull_requests_count":2,"bot_issues_count":0,"bot_pull_requests_count":1,"past_year_issues_count":1,"past_year_pull_requests_count":0,"past_year_avg_time_to_close_issue":null,"past_year_avg_time_to_close_pull_request":null,"past_year_issues_closed_count":0,"past_year_pull_requests_closed_count":0,"past_year_pull_request_authors_count":0,"past_year_issue_authors_count":1,"past_year_avg_comments_per_issue":0.0,"past_year_avg_comments_per_pull_request":null,"past_year_bot_issues_count":0,"past_year_bot_pull_requests_count":0,"past_year_merged_pull_requests_count":0,"issues_url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/repositories/citiususc%2Fpyplexity/issues","maintainers":[{"login":"MarcosFP97","count":1,"url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/authors/MarcosFP97"}],"active_maintainers":[]},"versions_url":"https://packages.ecosyste.ms/api/v1/registries/pypi.org/packages/pyplexity/versions","version_numbers_url":"https://packages.ecosyste.ms/api/v1/registries/pypi.org/packages/pyplexity/version_numbers","dependent_packages_url":"https://packages.ecosyste.ms/api/v1/registries/pypi.org/packages/pyplexity/dependent_packages","related_packages_url":"https://packages.ecosyste.ms/api/v1/registries/pypi.org/packages/pyplexity/related_packages","maintainers":[{"uuid":"manueldeprada","login":"manueldeprada","name":null,"email":null,"url":null,"packages_count":2,"html_url":"https://pypi.org/user/manueldeprada/","role":null,"created_at":"2023-02-25T05:03:09.501Z","updated_at":"2023-02-25T05:03:09.501Z","packages_url":"https://packages.ecosyste.ms/api/v1/registries/pypi.org/maintainers/manueldeprada/packages"},{"uuid":"MarcosFP97","login":"MarcosFP97","name":null,"email":null,"url":null,"packages_count":3,"html_url":"https://pypi.org/user/MarcosFP97/","role":null,"created_at":"2023-04-03T19:18:23.749Z","updated_at":"2023-04-03T19:18:23.749Z","packages_url":"https://packages.ecosyste.ms/api/v1/registries/pypi.org/maintainers/MarcosFP97/packages"}],"registry":{"name":"pypi.org","url":"https://pypi.org","ecosystem":"pypi","default":true,"packages_count":726767,"maintainers_count":308892,"namespaces_count":0,"keywords_count":238369,"github":"pypi","metadata":{"funded_packages_count":50594},"icon_url":"https://github.com/pypi.png","created_at":"2022-04-04T15:19:23.364Z","updated_at":"2025-09-09T06:31:19.922Z","packages_url":"https://packages.ecosyste.ms/api/v1/registries/pypi.org/packages","maintainers_url":"https://packages.ecosyste.ms/api/v1/registries/pypi.org/maintainers","namespaces_url":"https://packages.ecosyste.ms/api/v1/registries/pypi.org/namespaces"}}],"commits":{"id":639680,"full_name":"citiususc/pyplexity","default_branch":"main","committers":[{"name":"Manuel de Prada Corral","email":"eu@manueldeprada.com","count":8},{"name":"MarcosFP97","email":"40762225+MarcosFP97@users.noreply.github.com","count":6},{"name":"Manuel de Prada","email":"6536835+manueldeprada@users.noreply.github.com","count":6},{"name":"Marcos Fernández Pichel","email":"marcosfernandez.pichel@usc.es","count":3},{"name":"dependabot[bot]","email":"49699333+dependabot[bot]@users.noreply.github.com","count":1},{"name":"Manuel de Prada Corral","email":"manueldeprada@gmail.com","count":1}],"total_commits":25,"total_committers":6,"total_bot_commits":1,"total_bot_committers":1,"mean_commits":4.166666666666667,"dds":0.6799999999999999,"past_year_committers":null,"past_year_total_commits":null,"past_year_total_committers":null,"past_year_total_bot_commits":null,"past_year_total_bot_committers":null,"past_year_mean_commits":null,"past_year_dds":null,"last_synced_at":"2023-03-19T04:55:41.697Z","last_synced_commit":"5348adda1006ff5f2c6bd740afacb9aaaad006fd","created_at":"2023-03-09T08:49:18.912Z","updated_at":"2023-09-19T17:31:09.447Z","commits_url":"https://commits.ecosyste.ms/api/v1/hosts/GitHub/repositories/citiususc%2Fpyplexity/commits","host":{"name":"GitHub","url":"https://github.com","kind":"github","last_synced_at":"2025-09-10T00:25:43.995Z","repositories_count":5541222,"commits_count":875769132,"contributors_count":32330363,"owners_count":919428,"icon_url":"https://github.com/github.png","host_url":"https://commits.ecosyste.ms/api/v1/hosts/GitHub","repositories_url":"https://commits.ecosyste.ms/api/v1/hosts/GitHub/repositories"}},"issues_stats":{"full_name":"citiususc/pyplexity","html_url":"https://github.com/citiususc/pyplexity","last_synced_at":"2025-06-30T04:15:30.015Z","status":null,"issues_count":2,"pull_requests_count":2,"avg_time_to_close_issue":null,"avg_time_to_close_pull_request":75.0,"issues_closed_count":0,"pull_requests_closed_count":2,"pull_request_authors_count":2,"issue_authors_count":2,"avg_comments_per_issue":0.0,"avg_comments_per_pull_request":0.0,"merged_pull_requests_count":2,"bot_issues_count":0,"bot_pull_requests_count":1,"past_year_issues_count":1,"past_year_pull_requests_count":0,"past_year_avg_time_to_close_issue":null,"past_year_avg_time_to_close_pull_request":null,"past_year_issues_closed_count":0,"past_year_pull_requests_closed_count":0,"past_year_pull_request_authors_count":0,"past_year_issue_authors_count":1,"past_year_avg_comments_per_issue":0.0,"past_year_avg_comments_per_pull_request":null,"past_year_bot_issues_count":0,"past_year_bot_pull_requests_count":0,"past_year_merged_pull_requests_count":0,"created_at":"2023-05-14T21:42:03.631Z","updated_at":"2025-09-02T03:12:54.413Z","repository_url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/repositories/citiususc%2Fpyplexity","issues_url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/repositories/citiususc%2Fpyplexity/issues","issue_labels_count":{},"pull_request_labels_count":{"dependencies":1},"issue_author_associations_count":{"NONE":2},"pull_request_author_associations_count":{"MEMBER":1,"CONTRIBUTOR":1},"issue_authors":{"Xiaoshu-Zhao":1,"johnnyjana730":1},"pull_request_authors":{"MarcosFP97":1,"dependabot[bot]":1},"host":{"name":"GitHub","url":"https://github.com","kind":"github","last_synced_at":"2025-09-02T00:00:07.986Z","repositories_count":10021777,"issues_count":30401953,"pull_requests_count":90051100,"authors_count":10269412,"icon_url":"https://github.com/github.png","host_url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub","repositories_url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/repositories","owners_url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/owners","authors_url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/authors"},"past_year_issue_labels_count":{},"past_year_pull_request_labels_count":{},"past_year_issue_author_associations_count":{},"past_year_pull_request_author_associations_count":{},"past_year_issue_authors":{},"past_year_pull_request_authors":{},"maintainers":[{"login":"MarcosFP97","count":1,"url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/authors/MarcosFP97"}],"active_maintainers":[]},"events":{"total":{},"last_year":{}},"keywords":["information-retrieval","nlp","python","scraping","tag-cleaning"],"dependencies":[{"ecosystem":"pypi","filepath":"pyproject.toml","sha":null,"kind":"manifest","created_at":"2022-09-23T05:22:06.540Z","updated_at":"2022-09-23T05:22:06.540Z","repository_link":"https://github.com/citiususc/pyplexity/blob/main/pyproject.toml","dependencies":[{"id":5930441317,"package_name":"python","ecosystem":"pypi","requirements":"^3.6.1","direct":true,"kind":"runtime","optional":false},{"id":5930441318,"package_name":"typer","ecosystem":"pypi","requirements":"^0.4.0","direct":true,"kind":"runtime","optional":false},{"id":5930441319,"package_name":"Flask","ecosystem":"pypi","requirements":"^2.0.2","direct":true,"kind":"runtime","optional":false},{"id":5930441320,"package_name":"nltk","ecosystem":"pypi","requirements":"^3.6.7","direct":true,"kind":"runtime","optional":false},{"id":5930441321,"package_name":"pandas","ecosystem":"pypi","requirements":"^1.1.5","direct":true,"kind":"runtime","optional":false},{"id":5930441322,"package_name":"storable","ecosystem":"pypi","requirements":"^1.2.4","direct":true,"kind":"runtime","optional":false},{"id":5930441323,"package_name":"memory-tempfile","ecosystem":"pypi","requirements":"^2.2.3","direct":true,"kind":"runtime","optional":false},{"id":5930441324,"package_name":"warcio","ecosystem":"pypi","requirements":"^1.7.4","direct":true,"kind":"runtime","optional":false},{"id":5930441325,"package_name":"html5lib","ecosystem":"pypi","requirements":"^1.1","direct":true,"kind":"runtime","optional":false},{"id":5930441326,"package_name":"lxml","ecosystem":"pypi","requirements":"^4.7.1","direct":true,"kind":"runtime","optional":false},{"id":5930441327,"package_name":"cached-path","ecosystem":"pypi","requirements":"^1.0.2","direct":true,"kind":"runtime","optional":false},{"id":5930441328,"package_name":"pytest","ecosystem":"pypi","requirements":"^5.2","direct":true,"kind":"develop","optional":false}]},{"ecosystem":"pypi","filepath":"setup.py","sha":null,"kind":"manifest","created_at":"2024-12-02T02:49:42.886Z","updated_at":"2024-12-02T02:49:42.886Z","repository_link":"https://github.com/citiususc/pyplexity/blob/main/setup.py","dependencies":[]}],"score":16.78529713414499,"created_at":"2025-09-09T02:06:31.695Z","updated_at":"2025-10-07T08:41:24.694Z","avatar_url":"https://github.com/citiususc.png","language":"Python","category":null,"sub_category":null,"monthly_downloads":81196,"funding_links":[],"readme_doi_urls":[],"works":{},"citation_counts":{},"total_citations":0,"keywords_from_contributors":["labels"],"project_url":"https://science.ecosyste.ms/api/v1/projects/182944","html_url":"https://science.ecosyste.ms/projects/182944"}