{"id":39259,"name":"text-minhash-priority","description":"This repository implements the MinHash Near Deduplication with Priority algorithm.","url":"https://github.com/zmzhang2000/text-minhash-priority","last_synced_at":"2025-09-05T08:07:18.897Z","repository":{"id":303550303,"uuid":"1013033965","full_name":"zmzhang2000/text-minhash-priority","owner":"zmzhang2000","description":"This repository implements the MinHash Near Deduplication with Priority algorithm.","archived":false,"fork":false,"pushed_at":"2025-07-08T06:56:29.000Z","size":5784,"stargazers_count":0,"open_issues_count":0,"forks_count":0,"subscribers_count":0,"default_branch":"main","last_synced_at":"2025-07-08T07:51:38.457Z","etag":null,"topics":[],"latest_commit_sha":null,"homepage":"","language":"Python","has_issues":true,"has_wiki":null,"has_pages":null,"mirror_url":null,"source_name":null,"license":"apache-2.0","status":null,"scm":"git","pull_requests_enabled":true,"icon_url":"https://github.com/zmzhang2000.png","metadata":{"files":{"readme":"README.md","changelog":null,"contributing":null,"funding":null,"license":"LICENSE","code_of_conduct":null,"threat_model":null,"audit":null,"citation":"CITATION.bib","codeowners":null,"security":null,"support":null,"governance":null,"roadmap":null,"authors":null,"dei":null,"publiccode":null,"codemeta":null,"zenodo":null}},"created_at":"2025-07-03T08:59:24.000Z","updated_at":"2025-07-08T06:56:32.000Z","dependencies_parsed_at":"2025-07-12T19:01:53.338Z","dependency_job_id":null,"html_url":"https://github.com/zmzhang2000/text-minhash-priority","commit_stats":null,"previous_names":["zmzhang2000/text-minhash-priority"],"tags_count":0,"template":false,"template_full_name":null,"purl":"pkg:github/zmzhang2000/text-minhash-priority","repository_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/zmzhang2000%2Ftext-minhash-priority","tags_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/zmzhang2000%2Ftext-minhash-priority/tags","releases_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/zmzhang2000%2Ftext-minhash-priority/releases","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/zmzhang2000%2Ftext-minhash-priority/manifests","owner_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners/zmzhang2000","download_url":"https://codeload.github.com/zmzhang2000/text-minhash-priority/tar.gz/refs/heads/main","sbom_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/zmzhang2000%2Ftext-minhash-priority/sbom","scorecard":null,"host":{"name":"GitHub","url":"https://github.com","kind":"github","repositories_count":273728151,"owners_count":25157136,"icon_url":"https://github.com/github.png","version":null,"created_at":"2022-05-30T11:31:42.601Z","updated_at":"2022-07-04T15:15:14.044Z","status":"online","status_checked_at":"2025-09-05T02:00:09.113Z","response_time":402,"last_error":null,"robots_txt_status":"success","robots_txt_updated_at":"2025-07-24T06:49:26.215Z","robots_txt_url":"https://github.com/robots.txt","online":true,"can_crawl_api":true,"host_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub","repositories_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories","repository_names_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repository_names","owners_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners"}},"owner":{"login":"zmzhang2000","name":"Zongmeng Zhang","uuid":"45251366","kind":"user","description":"I am currently pursuing the master's degree in University of Science and Technology of China (USTC).","email":"","website":"https://zmzhang2000.github.io/","location":null,"twitter":null,"company":"University of Science and Technology of China","icon_url":"https://avatars.githubusercontent.com/u/45251366?v=4","repositories_count":1,"last_synced_at":"2023-05-17T03:27:20.423Z","metadata":{"has_sponsors_listing":false},"html_url":"https://github.com/zmzhang2000","funding_links":[],"total_stars":null,"followers":null,"following":null,"created_at":"2023-05-17T03:27:20.426Z","updated_at":"2023-05-17T03:27:20.426Z","owner_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners/zmzhang2000","repositories_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners/zmzhang2000/repositories"},"packages":null,"commits":{"message":"Repository syncing started."},"issues_stats":{"full_name":"zmzhang2000/text-minhash-priority","html_url":"https://github.com/zmzhang2000/text-minhash-priority","last_synced_at":null,"status":null,"issues_count":null,"pull_requests_count":null,"avg_time_to_close_issue":null,"avg_time_to_close_pull_request":null,"issues_closed_count":null,"pull_requests_closed_count":null,"pull_request_authors_count":null,"issue_authors_count":null,"avg_comments_per_issue":null,"avg_comments_per_pull_request":null,"merged_pull_requests_count":null,"bot_issues_count":null,"bot_pull_requests_count":null,"past_year_issues_count":null,"past_year_pull_requests_count":null,"past_year_avg_time_to_close_issue":null,"past_year_avg_time_to_close_pull_request":null,"past_year_issues_closed_count":null,"past_year_pull_requests_closed_count":null,"past_year_pull_request_authors_count":null,"past_year_issue_authors_count":null,"past_year_avg_comments_per_issue":null,"past_year_avg_comments_per_pull_request":null,"past_year_bot_issues_count":null,"past_year_bot_pull_requests_count":null,"past_year_merged_pull_requests_count":null,"created_at":"2025-09-05T08:06:21.546Z","updated_at":"2025-09-05T08:06:21.546Z","repository_url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/repositories/zmzhang2000%2Ftext-minhash-priority","issues_url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/repositories/zmzhang2000%2Ftext-minhash-priority/issues","issue_labels_count":{},"pull_request_labels_count":{},"issue_author_associations_count":{},"pull_request_author_associations_count":{},"issue_authors":{},"pull_request_authors":{},"host":{"name":"GitHub","url":"https://github.com","kind":"github","last_synced_at":"2025-09-05T00:00:10.444Z","repositories_count":10094553,"issues_count":31373669,"pull_requests_count":97058592,"authors_count":10699554,"icon_url":"https://github.com/github.png","host_url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub","repositories_url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/repositories","owners_url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/owners","authors_url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/authors"},"past_year_issue_labels_count":{},"past_year_pull_request_labels_count":{},"past_year_issue_author_associations_count":{},"past_year_pull_request_author_associations_count":{},"past_year_issue_authors":{},"past_year_pull_request_authors":{},"maintainers":[],"active_maintainers":[]},"events":{"total":{"PushEvent":1},"last_year":{"PushEvent":1}},"keywords":[],"dependencies":[{"ecosystem":"actions","filepath":".github/workflows/bot.yml","sha":null,"kind":"manifest","created_at":"2025-07-08T07:51:43.002Z","updated_at":"2025-07-08T07:51:43.002Z","repository_link":"https://github.com/zmzhang2000/text-minhash-priority/blob/main/.github/workflows/bot.yml","dependencies":[{"id":24030663363,"package_name":"actions/stale","ecosystem":"actions","requirements":"v9.0.0","direct":true,"kind":"composite","optional":false}]},{"ecosystem":"actions","filepath":".github/workflows/coverage.yaml","sha":null,"kind":"manifest","created_at":"2025-07-08T07:51:43.393Z","updated_at":"2025-07-08T07:51:43.393Z","repository_link":"https://github.com/zmzhang2000/text-minhash-priority/blob/main/.github/workflows/coverage.yaml","dependencies":[{"id":24030663389,"package_name":"actions/checkout","ecosystem":"actions","requirements":"v2","direct":true,"kind":"composite","optional":false},{"id":24030663390,"package_name":"codacy/codacy-coverage-reporter-action","ecosystem":"actions","requirements":"v1","direct":true,"kind":"composite","optional":false}]},{"ecosystem":"actions","filepath":".github/workflows/docs.yaml","sha":null,"kind":"manifest","created_at":"2025-07-08T07:51:45.470Z","updated_at":"2025-07-08T07:51:45.470Z","repository_link":"https://github.com/zmzhang2000/text-minhash-priority/blob/main/.github/workflows/docs.yaml","dependencies":[{"id":24030665618,"package_name":"actions/checkout","ecosystem":"actions","requirements":"v3","direct":true,"kind":"composite","optional":false},{"id":24030665619,"package_name":"actions/setup-python","ecosystem":"actions","requirements":"v3","direct":true,"kind":"composite","optional":false},{"id":24030665620,"package_name":"actions/upload-artifact","ecosystem":"actions","requirements":"v3","direct":true,"kind":"composite","optional":false},{"id":24030665621,"package_name":"actions/deploy-pages","ecosystem":"actions","requirements":"v1","direct":true,"kind":"composite","optional":false}]},{"ecosystem":"docker","filepath":"Dockerfile","sha":null,"kind":"manifest","created_at":"2025-07-08T07:51:45.546Z","updated_at":"2025-07-08T07:51:45.546Z","repository_link":"https://github.com/zmzhang2000/text-minhash-priority/blob/main/Dockerfile","dependencies":[{"id":24030665634,"package_name":"python","ecosystem":"docker","requirements":"3.10-slim","direct":true,"kind":"build","optional":false}]},{"ecosystem":"pypi","filepath":"poetry.lock","sha":null,"kind":"lockfile","created_at":"2025-07-08T07:51:45.614Z","updated_at":"2025-07-08T07:51:45.614Z","repository_link":"https://github.com/zmzhang2000/text-minhash-priority/blob/main/poetry.lock","dependencies":[{"id":24030665996,"package_name":"absl-py","ecosystem":"pypi","requirements":"2.1.0","direct":false,"kind":"runtime","optional":false},{"id":24030665999,"package_name":"aiohttp","ecosystem":"pypi","requirements":"3.9.5","direct":false,"kind":"runtime","optional":false},{"id":24030666001,"package_name":"aiosignal","ecosystem":"pypi","requirements":"1.3.1","direct":false,"kind":"runtime","optional":false},{"id":24030666004,"package_name":"alabaster","ecosystem":"pypi","requirements":"0.7.16","direct":false,"kind":"runtime","optional":false},{"id":24030666006,"package_name":"astunparse","ecosystem":"pypi","requirements":"1.6.3","direct":false,"kind":"runtime","optional":false},{"id":24030666009,"package_name":"async-timeout","ecosystem":"pypi","requirements":"4.0.3","direct":false,"kind":"runtime","optional":false},{"id":24030666011,"package_name":"attrs","ecosystem":"pypi","requirements":"23.2.0","direct":false,"kind":"runtime","optional":false},{"id":24030666015,"package_name":"babel","ecosystem":"pypi","requirements":"2.15.0","direct":false,"kind":"runtime","optional":false},{"id":24030666017,"package_name":"bitarray","ecosystem":"pypi","requirements":"2.9.2","direct":false,"kind":"runtime","optional":false},{"id":24030666020,"package_name":"certifi","ecosystem":"pypi","requirements":"2024.2.2","direct":false,"kind":"runtime","optional":false},{"id":24030666022,"package_name":"cffi","ecosystem":"pypi","requirements":"1.16.0","direct":false,"kind":"runtime","optional":false},{"id":24030666024,"package_name":"cfgv","ecosystem":"pypi","requirements":"3.4.0","direct":false,"kind":"runtime","optional":false},{"id":24030666026,"package_name":"charset-normalizer","ecosystem":"pypi","requirements":"3.3.2","direct":false,"kind":"runtime","optional":false},{"id":24030666029,"package_name":"click","ecosystem":"pypi","requirements":"8.1.7","direct":false,"kind":"runtime","optional":false},{"id":24030666030,"package_name":"click-option-group","ecosystem":"pypi","requirements":"0.5.6","direct":false,"kind":"runtime","optional":false},{"id":24030666736,"package_name":"colorama","ecosystem":"pypi","requirements":"0.4.6","direct":false,"kind":"runtime","optional":false},{"id":24030666737,"package_name":"coloredlogs","ecosystem":"pypi","requirements":"15.0.1","direct":false,"kind":"runtime","optional":false},{"id":24030666738,"package_name":"coverage","ecosystem":"pypi","requirements":"7.5.1","direct":false,"kind":"runtime","optional":false},{"id":24030666739,"package_name":"datasets","ecosystem":"pypi","requirements":"2.19.1","direct":false,"kind":"runtime","optional":false},{"id":24030666740,"package_name":"dill","ecosystem":"pypi","requirements":"0.3.8","direct":false,"kind":"runtime","optional":false},{"id":24030666741,"package_name":"distlib","ecosystem":"pypi","requirements":"0.3.8","direct":false,"kind":"runtime","optional":false},{"id":24030666742,"package_name":"docutils","ecosystem":"pypi","requirements":"0.21.2","direct":false,"kind":"runtime","optional":false},{"id":24030666743,"package_name":"exceptiongroup","ecosystem":"pypi","requirements":"1.2.1","direct":false,"kind":"runtime","optional":false},{"id":24030666744,"package_name":"filelock","ecosystem":"pypi","requirements":"3.14.0","direct":false,"kind":"runtime","optional":false},{"id":24030666745,"package_name":"fire","ecosystem":"pypi","requirements":"0.6.0","direct":false,"kind":"runtime","optional":false},{"id":24030666746,"package_name":"flatbuffers","ecosystem":"pypi","requirements":"24.3.25","direct":false,"kind":"runtime","optional":false},{"id":24030666747,"package_name":"frozenlist","ecosystem":"pypi","requirements":"1.4.1","direct":false,"kind":"runtime","optional":false},{"id":24030666748,"package_name":"fsspec","ecosystem":"pypi","requirements":"2024.3.1","direct":false,"kind":"runtime","optional":false},{"id":24030666749,"package_name":"ftfy","ecosystem":"pypi","requirements":"6.2.0","direct":false,"kind":"runtime","optional":false},{"id":24030666750,"package_name":"gast","ecosystem":"pypi","requirements":"0.5.4","direct":false,"kind":"runtime","optional":false},{"id":24030666751,"package_name":"google-pasta","ecosystem":"pypi","requirements":"0.2.0","direct":false,"kind":"runtime","optional":false},{"id":24030666752,"package_name":"grpcio","ecosystem":"pypi","requirements":"1.64.0","direct":false,"kind":"runtime","optional":false},{"id":24030666753,"package_name":"h5py","ecosystem":"pypi","requirements":"3.11.0","direct":false,"kind":"runtime","optional":false},{"id":24030666754,"package_name":"huggingface-hub","ecosystem":"pypi","requirements":"0.23.1","direct":false,"kind":"runtime","optional":false},{"id":24030666755,"package_name":"humanfriendly","ecosystem":"pypi","requirements":"10.0","direct":false,"kind":"runtime","optional":false},{"id":24030666756,"package_name":"identify","ecosystem":"pypi","requirements":"2.5.36","direct":false,"kind":"runtime","optional":false},{"id":24030666757,"package_name":"idna","ecosystem":"pypi","requirements":"3.7","direct":false,"kind":"runtime","optional":false},{"id":24030666758,"package_name":"imagesize","ecosystem":"pypi","requirements":"1.4.1","direct":false,"kind":"runtime","optional":false},{"id":24030666759,"package_name":"iniconfig","ecosystem":"pypi","requirements":"2.0.0","direct":false,"kind":"runtime","optional":false},{"id":24030666760,"package_name":"insegel","ecosystem":"pypi","requirements":"1.3.1","direct":false,"kind":"runtime","optional":false},{"id":24030667846,"package_name":"jaxtyping","ecosystem":"pypi","requirements":"0.2.28","direct":false,"kind":"runtime","optional":false},{"id":24030667849,"package_name":"jinja2","ecosystem":"pypi","requirements":"3.1.4","direct":false,"kind":"runtime","optional":false},{"id":24030667852,"package_name":"joblib","ecosystem":"pypi","requirements":"1.4.2","direct":false,"kind":"runtime","optional":false},{"id":24030667854,"package_name":"keras","ecosystem":"pypi","requirements":"3.3.3","direct":false,"kind":"runtime","optional":false},{"id":24030667857,"package_name":"latexcodec","ecosystem":"pypi","requirements":"3.0.0","direct":false,"kind":"runtime","optional":false},{"id":24030668444,"package_name":"libclang","ecosystem":"pypi","requirements":"18.1.1","direct":false,"kind":"runtime","optional":false},{"id":24030668445,"package_name":"markdown","ecosystem":"pypi","requirements":"3.6","direct":false,"kind":"runtime","optional":false},{"id":24030668446,"package_name":"markdown-it-py","ecosystem":"pypi","requirements":"3.0.0","direct":false,"kind":"runtime","optional":false},{"id":24030668447,"package_name":"markupsafe","ecosystem":"pypi","requirements":"2.1.5","direct":false,"kind":"runtime","optional":false},{"id":24030668448,"package_name":"mdurl","ecosystem":"pypi","requirements":"0.1.2","direct":false,"kind":"runtime","optional":false},{"id":24030668449,"package_name":"ml-dtypes","ecosystem":"pypi","requirements":"0.3.2","direct":false,"kind":"runtime","optional":false},{"id":24030668450,"package_name":"mpmath","ecosystem":"pypi","requirements":"1.3.0","direct":false,"kind":"runtime","optional":false},{"id":24030668451,"package_name":"multidict","ecosystem":"pypi","requirements":"6.0.5","direct":false,"kind":"runtime","optional":false},{"id":24030668452,"package_name":"multiprocess","ecosystem":"pypi","requirements":"0.70.16","direct":false,"kind":"runtime","optional":false},{"id":24030668453,"package_name":"namex","ecosystem":"pypi","requirements":"0.0.8","direct":false,"kind":"runtime","optional":false},{"id":24030668454,"package_name":"nodeenv","ecosystem":"pypi","requirements":"1.8.0","direct":false,"kind":"runtime","optional":false},{"id":24030668455,"package_name":"numpy","ecosystem":"pypi","requirements":"1.26.4","direct":false,"kind":"runtime","optional":false},{"id":24030668456,"package_name":"onnx","ecosystem":"pypi","requirements":"1.16.0","direct":false,"kind":"runtime","optional":false},{"id":24030668457,"package_name":"onnxruntime","ecosystem":"pypi","requirements":"1.18.0","direct":false,"kind":"runtime","optional":false},{"id":24030668458,"package_name":"opt-einsum","ecosystem":"pypi","requirements":"3.3.0","direct":false,"kind":"runtime","optional":false},{"id":24030668459,"package_name":"optree","ecosystem":"pypi","requirements":"0.11.0","direct":false,"kind":"runtime","optional":false},{"id":24030668460,"package_name":"packaging","ecosystem":"pypi","requirements":"24.0","direct":false,"kind":"runtime","optional":false},{"id":24030668461,"package_name":"pandas","ecosystem":"pypi","requirements":"2.2.2","direct":false,"kind":"runtime","optional":false},{"id":24030668462,"package_name":"platformdirs","ecosystem":"pypi","requirements":"4.2.2","direct":false,"kind":"runtime","optional":false},{"id":24030668463,"package_name":"pluggy","ecosystem":"pypi","requirements":"1.5.0","direct":false,"kind":"runtime","optional":false},{"id":24030668464,"package_name":"pre-commit","ecosystem":"pypi","requirements":"3.7.1","direct":false,"kind":"runtime","optional":false},{"id":24030668465,"package_name":"protobuf","ecosystem":"pypi","requirements":"4.25.3","direct":false,"kind":"runtime","optional":false},{"id":24030668466,"package_name":"psutil","ecosystem":"pypi","requirements":"5.9.8","direct":false,"kind":"runtime","optional":false},{"id":24030668467,"package_name":"py4j","ecosystem":"pypi","requirements":"0.10.9.7","direct":false,"kind":"runtime","optional":false},{"id":24030668468,"package_name":"pyarrow","ecosystem":"pypi","requirements":"16.1.0","direct":false,"kind":"runtime","optional":false},{"id":24030668469,"package_name":"pyarrow-hotfix","ecosystem":"pypi","requirements":"0.6","direct":false,"kind":"runtime","optional":false},{"id":24030668470,"package_name":"pybloom-live","ecosystem":"pypi","requirements":"4.0.0","direct":false,"kind":"runtime","optional":false},{"id":24030668661,"package_name":"pybtex","ecosystem":"pypi","requirements":"0.24.0","direct":false,"kind":"runtime","optional":false},{"id":24030669776,"package_name":"pybtex-docutils","ecosystem":"pypi","requirements":"1.0.3","direct":false,"kind":"runtime","optional":false},{"id":24030670381,"package_name":"pycparser","ecosystem":"pypi","requirements":"2.22","direct":false,"kind":"runtime","optional":false},{"id":24030670382,"package_name":"pygments","ecosystem":"pypi","requirements":"2.18.0","direct":false,"kind":"runtime","optional":false},{"id":24030670383,"package_name":"pyreadline3","ecosystem":"pypi","requirements":"3.4.1","direct":false,"kind":"runtime","optional":false},{"id":24030670384,"package_name":"pyspark","ecosystem":"pypi","requirements":"3.5.1","direct":false,"kind":"runtime","optional":false},{"id":24030670385,"package_name":"pytest","ecosystem":"pypi","requirements":"8.2.1","direct":false,"kind":"runtime","optional":false},{"id":24030670386,"package_name":"python-dateutil","ecosystem":"pypi","requirements":"2.9.0.post0","direct":false,"kind":"runtime","optional":false},{"id":24030670387,"package_name":"pytz","ecosystem":"pypi","requirements":"2024.1","direct":false,"kind":"runtime","optional":false},{"id":24030670388,"package_name":"pyyaml","ecosystem":"pypi","requirements":"6.0.1","direct":false,"kind":"runtime","optional":false},{"id":24030670389,"package_name":"regex","ecosystem":"pypi","requirements":"2024.5.15","direct":false,"kind":"runtime","optional":false},{"id":24030670390,"package_name":"requests","ecosystem":"pypi","requirements":"2.32.2","direct":false,"kind":"runtime","optional":false},{"id":24030670391,"package_name":"rich","ecosystem":"pypi","requirements":"13.7.1","direct":false,"kind":"runtime","optional":false},{"id":24030670392,"package_name":"ruff","ecosystem":"pypi","requirements":"0.3.7","direct":false,"kind":"runtime","optional":false},{"id":24030670393,"package_name":"scikit-learn","ecosystem":"pypi","requirements":"1.5.0","direct":false,"kind":"runtime","optional":false},{"id":24030670394,"package_name":"scipy","ecosystem":"pypi","requirements":"1.13.0","direct":false,"kind":"runtime","optional":false},{"id":24030670395,"package_name":"setuptools","ecosystem":"pypi","requirements":"70.0.0","direct":false,"kind":"runtime","optional":false},{"id":24030670396,"package_name":"six","ecosystem":"pypi","requirements":"1.16.0","direct":false,"kind":"runtime","optional":false},{"id":24030670397,"package_name":"snowballstemmer","ecosystem":"pypi","requirements":"2.2.0","direct":false,"kind":"runtime","optional":false},{"id":24030670398,"package_name":"sphinx","ecosystem":"pypi","requirements":"7.3.7","direct":false,"kind":"runtime","optional":false},{"id":24030670399,"package_name":"sphinxcontrib-applehelp","ecosystem":"pypi","requirements":"1.0.8","direct":false,"kind":"runtime","optional":false},{"id":24030670400,"package_name":"sphinxcontrib-bibtex","ecosystem":"pypi","requirements":"2.6.2","direct":false,"kind":"runtime","optional":false},{"id":24030670434,"package_name":"sphinxcontrib-devhelp","ecosystem":"pypi","requirements":"1.0.6","direct":false,"kind":"runtime","optional":false},{"id":24030670435,"package_name":"sphinxcontrib-htmlhelp","ecosystem":"pypi","requirements":"2.0.5","direct":false,"kind":"runtime","optional":false},{"id":24030670436,"package_name":"sphinxcontrib-jsmath","ecosystem":"pypi","requirements":"1.0.1","direct":false,"kind":"runtime","optional":false},{"id":24030670437,"package_name":"sphinxcontrib-qthelp","ecosystem":"pypi","requirements":"1.0.7","direct":false,"kind":"runtime","optional":false},{"id":24030670438,"package_name":"sphinxcontrib-serializinghtml","ecosystem":"pypi","requirements":"1.1.10","direct":false,"kind":"runtime","optional":false},{"id":24030670439,"package_name":"sympy","ecosystem":"pypi","requirements":"1.12","direct":false,"kind":"runtime","optional":false},{"id":24030670440,"package_name":"tabulate","ecosystem":"pypi","requirements":"0.9.0","direct":false,"kind":"runtime","optional":false},{"id":24030670441,"package_name":"tensorboard","ecosystem":"pypi","requirements":"2.16.2","direct":false,"kind":"runtime","optional":false},{"id":24030670442,"package_name":"tensorboard-data-server","ecosystem":"pypi","requirements":"0.7.2","direct":false,"kind":"runtime","optional":false},{"id":24030670443,"package_name":"tensorflow","ecosystem":"pypi","requirements":"2.16.1","direct":false,"kind":"runtime","optional":false},{"id":24030670444,"package_name":"tensorflow-io-gcs-filesystem","ecosystem":"pypi","requirements":"0.37.0","direct":false,"kind":"runtime","optional":false},{"id":24030670445,"package_name":"termcolor","ecosystem":"pypi","requirements":"2.4.0","direct":false,"kind":"runtime","optional":false},{"id":24030670446,"package_name":"threadpoolctl","ecosystem":"pypi","requirements":"3.5.0","direct":false,"kind":"runtime","optional":false},{"id":24030670447,"package_name":"tomli","ecosystem":"pypi","requirements":"2.0.1","direct":false,"kind":"runtime","optional":false},{"id":24030670448,"package_name":"tqdm","ecosystem":"pypi","requirements":"4.66.4","direct":false,"kind":"runtime","optional":false},{"id":24030670449,"package_name":"typeguard","ecosystem":"pypi","requirements":"2.13.3","direct":false,"kind":"runtime","optional":false},{"id":24030670450,"package_name":"typing-extensions","ecosystem":"pypi","requirements":"4.11.0","direct":false,"kind":"runtime","optional":false},{"id":24030670451,"package_name":"tzdata","ecosystem":"pypi","requirements":"2024.1","direct":false,"kind":"runtime","optional":false},{"id":24030670452,"package_name":"unisim","ecosystem":"pypi","requirements":"0.0.1","direct":false,"kind":"runtime","optional":false},{"id":24030670510,"package_name":"urllib3","ecosystem":"pypi","requirements":"1.26.18","direct":false,"kind":"runtime","optional":false},{"id":24030670511,"package_name":"usearch","ecosystem":"pypi","requirements":"2.12.0","direct":false,"kind":"runtime","optional":false},{"id":24030670607,"package_name":"virtualenv","ecosystem":"pypi","requirements":"20.26.2","direct":false,"kind":"runtime","optional":false},{"id":24030670608,"package_name":"wcwidth","ecosystem":"pypi","requirements":"0.2.13","direct":false,"kind":"runtime","optional":false},{"id":24030670609,"package_name":"werkzeug","ecosystem":"pypi","requirements":"3.0.3","direct":false,"kind":"runtime","optional":false},{"id":24030670610,"package_name":"wheel","ecosystem":"pypi","requirements":"0.43.0","direct":false,"kind":"runtime","optional":false},{"id":24030670611,"package_name":"wrapt","ecosystem":"pypi","requirements":"1.16.0","direct":false,"kind":"runtime","optional":false},{"id":24030670612,"package_name":"xxhash","ecosystem":"pypi","requirements":"3.4.1","direct":false,"kind":"runtime","optional":false},{"id":24030670613,"package_name":"yarl","ecosystem":"pypi","requirements":"1.9.4","direct":false,"kind":"runtime","optional":false},{"id":24030670614,"package_name":"zstandard","ecosystem":"pypi","requirements":"0.22.0","direct":false,"kind":"runtime","optional":false}]},{"ecosystem":"pypi","filepath":"pyproject.toml","sha":null,"kind":"manifest","created_at":"2025-07-08T07:51:52.120Z","updated_at":"2025-07-08T07:51:52.120Z","repository_link":"https://github.com/zmzhang2000/text-minhash-priority/blob/main/pyproject.toml","dependencies":[{"id":24030670626,"package_name":"python","ecosystem":"pypi","requirements":"^3.10","direct":true,"kind":"runtime","optional":false},{"id":24030670627,"package_name":"numpy","ecosystem":"pypi","requirements":"\u003e=1.26.4","direct":true,"kind":"runtime","optional":false},{"id":24030670628,"package_name":"tqdm","ecosystem":"pypi","requirements":"\u003e=4.64.1","direct":true,"kind":"runtime","optional":false},{"id":24030670629,"package_name":"datasets","ecosystem":"pypi","requirements":"\u003e=2.17.0","direct":true,"kind":"runtime","optional":false},{"id":24030670630,"package_name":"scipy","ecosystem":"pypi","requirements":"\u003e=1.10.1","direct":true,"kind":"runtime","optional":false},{"id":24030670631,"package_name":"xxhash","ecosystem":"pypi","requirements":"\u003e=3.0.0","direct":true,"kind":"runtime","optional":false},{"id":24030670632,"package_name":"pybloom-live","ecosystem":"pypi","requirements":"\u003e=4.0.0","direct":true,"kind":"runtime","optional":false},{"id":24030670633,"package_name":"bitarray","ecosystem":"pypi","requirements":"\u003e=2.6.2","direct":true,"kind":"runtime","optional":false},{"id":24030670634,"package_name":"pyspark","ecosystem":"pypi","requirements":"\u003e=3.3.1","direct":true,"kind":"runtime","optional":false},{"id":24030670635,"package_name":"regex","ecosystem":"pypi","requirements":"\u003e=2023.5.5","direct":true,"kind":"runtime","optional":false},{"id":24030670636,"package_name":"urllib3","ecosystem":"pypi","requirements":"\u003c=2.0","direct":true,"kind":"runtime","optional":false},{"id":24030670637,"package_name":"sphinxcontrib-bibtex","ecosystem":"pypi","requirements":"\u003e=2.5.0","direct":true,"kind":"runtime","optional":false},{"id":24030670638,"package_name":"zstandard","ecosystem":"pypi","requirements":"\u003e=0.21.0","direct":true,"kind":"runtime","optional":false},{"id":24030670639,"package_name":"ftfy","ecosystem":"pypi","requirements":"\u003e=6.1.1","direct":true,"kind":"runtime","optional":false},{"id":24030670640,"package_name":"setuptools","ecosystem":"pypi","requirements":"\u003e=69.1.0","direct":true,"kind":"runtime","optional":false},{"id":24030670641,"package_name":"psutil","ecosystem":"pypi","requirements":"\u003e=5.9.8","direct":true,"kind":"runtime","optional":false},{"id":24030670642,"package_name":"fire","ecosystem":"pypi","requirements":"^0.6.0","direct":true,"kind":"runtime","optional":false},{"id":24030670643,"package_name":"click","ecosystem":"pypi","requirements":"^8.1.7","direct":true,"kind":"runtime","optional":false},{"id":24030670644,"package_name":"click-option-group","ecosystem":"pypi","requirements":"^0.5.6","direct":true,"kind":"runtime","optional":false},{"id":24030670645,"package_name":"rich","ecosystem":"pypi","requirements":"^13.7.1","direct":true,"kind":"runtime","optional":false},{"id":24030670646,"package_name":"unisim","ecosystem":"pypi","requirements":"^0.0.1","direct":true,"kind":"runtime","optional":false},{"id":24030670647,"package_name":"tensorflow","ecosystem":"pypi","requirements":"^2.16.1","direct":true,"kind":"runtime","optional":false},{"id":24030670648,"package_name":"pandarallel","ecosystem":"pypi","requirements":"^1.6.5","direct":true,"kind":"runtime","optional":false},{"id":24030671761,"package_name":"matplotlib","ecosystem":"pypi","requirements":"\u003e=3.10.3","direct":true,"kind":"runtime","optional":false},{"id":24030671762,"package_name":"pre-commit","ecosystem":"pypi","requirements":"^3.6.2","direct":true,"kind":"develop","optional":false},{"id":24030671763,"package_name":"insegel","ecosystem":"pypi","requirements":"^1.3.1","direct":true,"kind":"develop","optional":false},{"id":24030671764,"package_name":"pytest","ecosystem":"pypi","requirements":"^8.0.2","direct":true,"kind":"develop","optional":false},{"id":24030671765,"package_name":"coverage","ecosystem":"pypi","requirements":"^7.4.3","direct":true,"kind":"develop","optional":false},{"id":24030671766,"package_name":"ruff","ecosystem":"pypi","requirements":"^0.3.2","direct":true,"kind":"develop","optional":false},{"id":24030671767,"package_name":"tabulate","ecosystem":"pypi","requirements":"^0.9.0","direct":true,"kind":"develop","optional":false},{"id":24030671768,"package_name":"scikit-learn","ecosystem":"pypi","requirements":"^1.4.1.post1","direct":true,"kind":"develop","optional":false}]}],"score":null,"created_at":"2025-09-04T15:51:13.485Z","updated_at":"2025-10-07T08:16:05.383Z","avatar_url":"https://github.com/zmzhang2000.png","language":"Python","category":null,"sub_category":null,"monthly_downloads":0,"funding_links":[],"readme_doi_urls":[],"works":{},"citation_counts":{},"total_citations":0,"keywords_from_contributors":[],"project_url":"https://science.ecosyste.ms/api/v1/projects/39259","html_url":"https://science.ecosyste.ms/projects/39259","bibtex_url":"https://science.ecosyste.ms/projects/39259/export.bibtex","apalike_url":"https://science.ecosyste.ms/projects/39259/export.apalike"}