{"id":5621,"name":"ticcltools","description":"Tools for TICCL","url":"https://github.com/languagemachines/ticcltools","last_synced_at":"2025-09-04T18:45:37.305Z","repository":{"id":60721907,"uuid":"45118973","full_name":"LanguageMachines/ticcltools","owner":"LanguageMachines","description":"Tools for TICCL","archived":false,"fork":false,"pushed_at":"2025-06-10T12:28:21.000Z","size":260294,"stargazers_count":14,"open_issues_count":17,"forks_count":4,"subscribers_count":7,"default_branch":"master","last_synced_at":"2025-08-23T05:49:31.801Z","etag":null,"topics":[],"latest_commit_sha":null,"homepage":null,"language":"C++","has_issues":true,"has_wiki":null,"has_pages":null,"mirror_url":null,"source_name":null,"license":"gpl-3.0","status":null,"scm":"git","pull_requests_enabled":true,"icon_url":"https://github.com/LanguageMachines.png","metadata":{"files":{"readme":"README","changelog":"NEWS","contributing":null,"funding":null,"license":"COPYING","code_of_conduct":null,"threat_model":null,"audit":null,"citation":null,"codeowners":null,"security":null,"support":null,"governance":null,"roadmap":null,"authors":"AUTHORS","dei":null,"publiccode":null,"codemeta":"codemeta.json","zenodo":null}},"created_at":"2015-10-28T14:42:46.000Z","updated_at":"2024-12-16T10:36:45.000Z","dependencies_parsed_at":"2025-04-10T15:22:45.286Z","dependency_job_id":null,"html_url":"https://github.com/LanguageMachines/ticcltools","commit_stats":{"total_commits":790,"total_committers":5,"mean_commits":158.0,"dds":"0.11392405063291144","last_synced_commit":"07b30f98bd2c5b5d89069eea660917c3fd64e718"},"previous_names":[],"tags_count":9,"template":false,"template_full_name":null,"purl":"pkg:github/LanguageMachines/ticcltools","repository_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/LanguageMachines%2Fticcltools","tags_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/LanguageMachines%2Fticcltools/tags","releases_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/LanguageMachines%2Fticcltools/releases","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/LanguageMachines%2Fticcltools/manifests","owner_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners/LanguageMachines","download_url":"https://codeload.github.com/LanguageMachines/ticcltools/tar.gz/refs/heads/master","sbom_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/LanguageMachines%2Fticcltools/sbom","scorecard":null,"host":{"name":"GitHub","url":"https://github.com","kind":"github","repositories_count":273656518,"owners_count":25145001,"icon_url":"https://github.com/github.png","version":null,"created_at":"2022-05-30T11:31:42.601Z","updated_at":"2022-07-04T15:15:14.044Z","status":"online","status_checked_at":"2025-09-04T02:00:08.968Z","response_time":61,"last_error":null,"robots_txt_status":"success","robots_txt_updated_at":"2025-07-24T06:49:26.215Z","robots_txt_url":"https://github.com/robots.txt","online":true,"can_crawl_api":true,"host_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub","repositories_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories","repository_names_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repository_names","owners_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners"}},"owner":{"login":"LanguageMachines","name":"Language Machines","uuid":"3313855","kind":"organization","description":"NLP Research group at Centre for Language Studies, Radboud University Nijmegen","email":"proycon@anaproy.nl","website":"http://cls.ru.nl/languagemachines","location":"Nijmegen, The Netherlands","twitter":null,"company":null,"icon_url":"https://avatars.githubusercontent.com/u/3313855?v=4","repositories_count":53,"last_synced_at":"2024-03-26T13:57:21.115Z","metadata":{"has_sponsors_listing":false},"html_url":"https://github.com/LanguageMachines","funding_links":[],"total_stars":343,"followers":6,"following":0,"created_at":"2022-11-03T20:54:46.619Z","updated_at":"2024-03-26T13:57:22.047Z","owner_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners/LanguageMachines","repositories_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners/LanguageMachines/repositories"},"packages":[{"id":5293957,"name":"ticcltools","ecosystem":"conda","description":"TicclTools is a collection of programs to process datafiles, together they constitute the bulk of TICCL: Text Induced Corpus-Cleanup. The main programs in this colection are: * TICCL-indexer and TICCL-indexerNT:   a tool to create an exhaustive index to all lexical variants given a particular Levenshtein or edit distance in a corpus. * TICCL-anahash:   a tool to create anagram hashes form a word frequency file. Also creates ab 'alphabet' file of the unicode characters that are present in the corpus. * TICCL-LDcalc:   a proprocessing tool for TICCL-rank. Gathers the info from TICC-anahash, TICCL-indexer, TICCL-lexstat and TICCL-unk * TICCL-rank:   ranks a word varian list according to al lot of criteria * TICCL-unk:   a cleanup tool for word frequency lists. creates a 'clean' file with desirable words, an 'unk' file with uncorrectable words and a 'punct' file with words that would be clean after removing puncuation. * TICCL-lexstat:   convert an 'alphabet' file (from TICCL-anahash) into a frequency list of hashes and optionally a list of confusions.","homepage":"https://github.com/LanguageMachines/ticcltools","licenses":"GPL-3.0-only","normalized_licenses":["GPL-3.0-only"],"repository_url":"https://github.com/LanguageMachines/ticcltools","keywords_array":[],"namespace":null,"versions_count":4,"first_release_published_at":"2019-01-30T17:24:54.000Z","latest_release_published_at":"2021-02-04T14:42:36.000Z","latest_release_number":"0.7.1","last_synced_at":"2025-08-16T07:04:58.047Z","created_at":"2022-10-03T15:56:06.204Z","updated_at":"2025-08-16T07:04:58.047Z","registry_url":"https://anaconda.org/conda-forge/ticcltools","install_command":"conda install -c conda-forge ticcltools","documentation_url":null,"metadata":{},"repo_metadata":{"uuid":"45118973","full_name":"LanguageMachines/ticcltools","owner":"LanguageMachines","description":"Tools for TICCL","archived":false,"fork":false,"pushed_at":"2023-03-01T10:47:49.000Z","size":244418,"stargazers_count":13,"open_issues_count":18,"forks_count":3,"subscribers_count":7,"default_branch":"master","last_synced_at":"2023-03-13T21:02:09.571Z","etag":null,"topics":[],"latest_commit_sha":null,"homepage":null,"language":"C++","has_issues":true,"has_wiki":null,"has_pages":null,"mirror_url":null,"source_name":null,"license":"gpl-3.0","status":null,"scm":"git","pull_requests_enabled":true,"logo_url":null,"metadata":{"files":{"readme":"README","changelog":null,"contributing":null,"funding":null,"license":"COPYING","code_of_conduct":null,"threat_model":null,"audit":null,"citation":null,"codeowners":null,"security":null,"support":null}},"created_at":"2015-10-28T14:42:46.000Z","updated_at":"2023-01-26T15:46:19.000Z","dependencies_parsed_at":"2023-02-01T04:00:19.011Z","dependency_job_id":null,"html_url":"https://github.com/LanguageMachines/ticcltools","commit_stats":null,"repository_url":"http://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/LanguageMachines%2Fticcltools","tags_url":"http://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/LanguageMachines%2Fticcltools/tags","manifests_url":"http://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/LanguageMachines%2Fticcltools/manifests","owner_url":"http://repos.ecosyste.ms/api/v1/hosts/GitHub/owners/LanguageMachines","host":{"name":"GitHub","url":"https://github.com","kind":"github","repositories_count":108921946,"host_url":"http://repos.ecosyste.ms/api/v1/hosts/GitHub","repositories_url":"http://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories","repository_names_url":"http://repos.ecosyste.ms/api/v1/hosts/GitHub/repository_names"},"owner_record":{"login":"LanguageMachines","name":"Language Machines","uuid":"3313855","kind":"organization","description":"NLP Research group at Centre for Language Studies, Radboud University Nijmegen","email":"proycon@anaproy.nl","website":"http://cls.ru.nl/languagemachines","location":"Nijmegen, The Netherlands","twitter":null,"company":null,"avatar_url":"https://avatars.githubusercontent.com/u/3313855?v=4","repositories_count":17,"last_synced_at":"2023-02-16T11:05:10.845Z","metadata":{"has_sponsors_listing":false},"owner_url":"http://repos.ecosyste.ms/api/v1/hosts/GitHub/owners/LanguageMachines"},"tags":[{"name":"v0.9","sha":"f7d44e19b4b7db4619c98681cab098489f812d9d","kind":"commit","published_at":"2022-09-13T18:13:30.000Z","download_url":"https://codeload.github.com/LanguageMachines/ticcltools/tar.gz/v0.9","html_url":"https://github.com/LanguageMachines/ticcltools/releases/tag/v0.9"},{"name":"v0.8","sha":"82c8b291b69971e82f3756909ee319c381b4bc8d","kind":"commit","published_at":"2021-12-15T14:41:46.000Z","download_url":"https://codeload.github.com/LanguageMachines/ticcltools/tar.gz/v0.8","html_url":"https://github.com/LanguageMachines/ticcltools/releases/tag/v0.8"},{"name":"v0.7.1","sha":"9b25e32c8f916c723d10c2571e7d8af192d62192","kind":"commit","published_at":"2020-09-15T11:03:13.000Z","download_url":"https://codeload.github.com/LanguageMachines/ticcltools/tar.gz/v0.7.1","html_url":"https://github.com/LanguageMachines/ticcltools/releases/tag/v0.7.1"},{"name":"v0.7","sha":"04b114879de0c9f558fc8d0a6e262e4c33b2014f","kind":"commit","published_at":"2020-04-15T13:01:04.000Z","download_url":"https://codeload.github.com/LanguageMachines/ticcltools/tar.gz/v0.7","html_url":"https://github.com/LanguageMachines/ticcltools/releases/tag/v0.7"},{"name":"v0.6","sha":"1d5c4a4ef9401db6058afb469aa76a992d8f73d7","kind":"commit","published_at":"2018-06-05T10:46:54.000Z","download_url":"https://codeload.github.com/LanguageMachines/ticcltools/tar.gz/v0.6","html_url":"https://github.com/LanguageMachines/ticcltools/releases/tag/v0.6"},{"name":"v0.5","sha":"63c3121e462b115041d5895fed65c9cc76d55e83","kind":"commit","published_at":"2018-02-19T14:54:53.000Z","download_url":"https://codeload.github.com/LanguageMachines/ticcltools/tar.gz/v0.5","html_url":"https://github.com/LanguageMachines/ticcltools/releases/tag/v0.5"},{"name":"v0.4","sha":"2cf77745bee0c736a4db7af8faa39af704847b96","kind":"commit","published_at":"2017-04-04T10:37:38.000Z","download_url":"https://codeload.github.com/LanguageMachines/ticcltools/tar.gz/v0.4","html_url":"https://github.com/LanguageMachines/ticcltools/releases/tag/v0.4"}]},"repo_metadata_updated_at":"2023-03-22T07:26:43.945Z","dependent_packages_count":0,"downloads":null,"downloads_period":null,"dependent_repos_count":0,"rankings":{"downloads":null,"dependent_repos_count":34.025455452957324,"dependent_packages_count":51.17544297479411,"stargazers_count":48.93436486149239,"forks_count":51.64462191165461,"average":46.44497130022461},"purl":"pkg:conda/ticcltools","advisories":[],"docker_usage_url":"https://docker.ecosyste.ms/usage/conda/ticcltools","docker_dependents_count":null,"docker_downloads_count":null,"usage_url":"https://repos.ecosyste.ms/usage/conda/ticcltools","dependent_repositories_url":"https://repos.ecosyste.ms/api/v1/usage/conda/ticcltools/dependencies","status":null,"funding_links":[],"critical":null,"issue_metadata":{"last_synced_at":"2023-08-09T03:48:40.470Z","issues_count":46,"pull_requests_count":0,"avg_time_to_close_issue":10184127.407407407,"avg_time_to_close_pull_request":null,"issues_closed_count":27,"pull_requests_closed_count":0,"pull_request_authors_count":0,"issue_authors_count":7,"avg_comments_per_issue":4.478260869565218,"avg_comments_per_pull_request":null,"merged_pull_requests_count":0,"bot_issues_count":0,"bot_pull_requests_count":0,"past_year_issues_count":2,"past_year_pull_requests_count":0,"past_year_avg_time_to_close_issue":null,"past_year_avg_time_to_close_pull_request":null,"past_year_issues_closed_count":0,"past_year_pull_requests_closed_count":0,"past_year_pull_request_authors_count":0,"past_year_issue_authors_count":2,"past_year_avg_comments_per_issue":3.0,"past_year_avg_comments_per_pull_request":null,"past_year_bot_issues_count":0,"past_year_bot_pull_requests_count":0,"past_year_merged_pull_requests_count":0},"versions_url":"https://packages.ecosyste.ms/api/v1/registries/conda-forge.org/packages/ticcltools/versions","version_numbers_url":"https://packages.ecosyste.ms/api/v1/registries/conda-forge.org/packages/ticcltools/version_numbers","dependent_packages_url":"https://packages.ecosyste.ms/api/v1/registries/conda-forge.org/packages/ticcltools/dependent_packages","related_packages_url":"https://packages.ecosyste.ms/api/v1/registries/conda-forge.org/packages/ticcltools/related_packages","maintainers":[],"registry":{"name":"conda-forge.org","url":"https://conda-forge.org","ecosystem":"conda","default":false,"packages_count":20636,"maintainers_count":0,"namespaces_count":0,"keywords_count":13387,"github":"conda-forge","metadata":{"kind":"conda-forge","key":"CondaForge","api":"https://conda.anaconda.org","funded_packages_count":2180},"icon_url":"https://github.com/conda-forge.png","created_at":"2022-10-03T15:37:08.743Z","updated_at":"2025-09-04T07:00:12.892Z","packages_url":"https://packages.ecosyste.ms/api/v1/registries/conda-forge.org/packages","maintainers_url":"https://packages.ecosyste.ms/api/v1/registries/conda-forge.org/maintainers","namespaces_url":"https://packages.ecosyste.ms/api/v1/registries/conda-forge.org/namespaces"}}],"commits":{"id":29786,"full_name":"LanguageMachines/ticcltools","default_branch":"master","committers":[{"name":"Ko van der Sloot","email":"K.vanderSloot@let.ru.nl","count":700},{"name":"Ko van der Sloot","email":"Ko.vanderSloot@ziggo.nl","count":48},{"name":"martinreynaert","email":"martinreynaert@users.noreply.github.com","count":24},{"name":"Maarten van Gompel","email":"proycon@anaproy.nl","count":10},{"name":"sloot","email":"sloot@12f355fe-0486-481a-ad91-c297ab22b4e3","count":8}],"total_commits":790,"total_committers":5,"total_bot_commits":0,"total_bot_committers":0,"mean_commits":158.0,"dds":0.11392405063291144,"past_year_committers":[{"name":"Ko van der Sloot","email":"Ko.vanderSloot@ziggo.nl","count":33},{"name":"Maarten van Gompel","email":"proycon@anaproy.nl","count":5}],"past_year_total_commits":38,"past_year_total_committers":2,"past_year_total_bot_commits":0,"past_year_total_bot_committers":0,"past_year_mean_commits":19.0,"past_year_dds":0.13157894736842102,"last_synced_at":"2023-04-26T14:43:28.094Z","last_synced_commit":"07b30f98bd2c5b5d89069eea660917c3fd64e718","created_at":"2023-03-07T16:41:59.004Z","updated_at":"2023-09-19T15:43:10.640Z","commits_url":"https://commits.ecosyste.ms/api/v1/hosts/GitHub/repositories/LanguageMachines%2Fticcltools/commits","host":{"name":"GitHub","url":"https://github.com","kind":"github","last_synced_at":"2025-09-04T00:00:25.936Z","repositories_count":5480019,"commits_count":853389012,"contributors_count":31098138,"owners_count":906558,"icon_url":"https://github.com/github.png","host_url":"https://commits.ecosyste.ms/api/v1/hosts/GitHub","repositories_url":"https://commits.ecosyste.ms/api/v1/hosts/GitHub/repositories"}},"issues_stats":{"full_name":"LanguageMachines/ticcltools","html_url":"https://github.com/LanguageMachines/ticcltools","last_synced_at":"2024-12-04T09:14:51.231Z","status":null,"issues_count":47,"pull_requests_count":0,"avg_time_to_close_issue":17704165.666666668,"avg_time_to_close_pull_request":null,"issues_closed_count":30,"pull_requests_closed_count":0,"pull_request_authors_count":0,"issue_authors_count":7,"avg_comments_per_issue":4.468085106382978,"avg_comments_per_pull_request":null,"merged_pull_requests_count":0,"bot_issues_count":0,"bot_pull_requests_count":0,"past_year_issues_count":1,"past_year_pull_requests_count":0,"past_year_avg_time_to_close_issue":14604.0,"past_year_avg_time_to_close_pull_request":null,"past_year_issues_closed_count":1,"past_year_pull_requests_closed_count":0,"past_year_pull_request_authors_count":0,"past_year_issue_authors_count":1,"past_year_avg_comments_per_issue":2.0,"past_year_avg_comments_per_pull_request":null,"past_year_bot_issues_count":0,"past_year_bot_pull_requests_count":0,"past_year_merged_pull_requests_count":0,"created_at":"2023-05-10T21:15:53.896Z","updated_at":"2025-09-01T10:24:27.931Z","repository_url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/repositories/LanguageMachines%2Fticcltools","issues_url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/repositories/LanguageMachines%2Fticcltools/issues","issue_labels_count":{"enhancement":20,"testing":4,"bug":3,"invalid":1,"help wanted":1,"question":1},"pull_request_labels_count":{},"issue_author_associations_count":{"COLLABORATOR":39,"MEMBER":4,"NONE":4},"pull_request_author_associations_count":{},"issue_authors":{"martinreynaert":21,"kosloot":18,"proycon":4,"egpbos":1,"tokee":1,"VincentCCL":1,"peterdekker":1},"pull_request_authors":{},"host":{"name":"GitHub","url":"https://github.com","kind":"github","last_synced_at":"2025-09-02T00:00:07.986Z","repositories_count":10046920,"issues_count":30704063,"pull_requests_count":91816424,"authors_count":10486554,"icon_url":"https://github.com/github.png","host_url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub","repositories_url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/repositories","owners_url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/owners","authors_url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/authors"},"past_year_issue_labels_count":{},"past_year_pull_request_labels_count":{},"past_year_issue_author_associations_count":{},"past_year_pull_request_author_associations_count":{},"past_year_issue_authors":{},"past_year_pull_request_authors":{},"maintainers":[{"login":"martinreynaert","count":21,"url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/authors/martinreynaert"},{"login":"kosloot","count":18,"url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/authors/kosloot"},{"login":"proycon","count":4,"url":"https://issues.ecosyste.ms/api/v1/hosts/GitHub/authors/proycon"}],"active_maintainers":[]},"events":{"total":{"ReleaseEvent":1,"PushEvent":2,"ForkEvent":1,"CreateEvent":1},"last_year":{"ReleaseEvent":1,"PushEvent":2,"ForkEvent":1,"CreateEvent":1}},"keywords":[],"dependencies":[{"ecosystem":"docker","filepath":"Dockerfile","sha":null,"kind":"manifest","created_at":"2023-02-01T04:00:19.002Z","updated_at":"2023-02-01T04:00:19.002Z","repository_link":"https://github.com/LanguageMachines/ticcltools/blob/master/Dockerfile","dependencies":[{"id":7288819209,"package_name":"alpine","ecosystem":"docker","requirements":"latest","direct":true,"kind":"build","optional":false}]},{"ecosystem":"actions","filepath":".github/workflows/cleanup.yml","sha":null,"kind":"manifest","created_at":"2023-11-14T19:51:11.900Z","updated_at":"2023-11-14T19:51:11.900Z","repository_link":"https://github.com/LanguageMachines/ticcltools/blob/master/.github/workflows/cleanup.yml","dependencies":[{"id":14499335492,"package_name":"Mattraks/delete-workflow-runs","ecosystem":"actions","requirements":"v2","direct":true,"kind":"composite","optional":false}]},{"ecosystem":"actions","filepath":".github/workflows/ticcltools.yml","sha":null,"kind":"manifest","created_at":"2023-11-14T19:51:12.015Z","updated_at":"2023-11-14T19:51:12.015Z","repository_link":"https://github.com/LanguageMachines/ticcltools/blob/master/.github/workflows/ticcltools.yml","dependencies":[{"id":14499335645,"package_name":"Gottox/irc-message-action","ecosystem":"actions","requirements":"v2","direct":true,"kind":"composite","optional":false},{"id":14499335710,"package_name":"styfle/cancel-workflow-action","ecosystem":"actions","requirements":"0.11.0","direct":true,"kind":"composite","optional":false},{"id":14499335711,"package_name":"actions/checkout","ecosystem":"actions","requirements":"v3","direct":true,"kind":"composite","optional":false}]}],"score":null,"created_at":"2025-09-04T15:50:16.639Z","updated_at":"2025-11-04T15:50:44.278Z","avatar_url":"https://github.com/LanguageMachines.png","language":"C++","category":null,"sub_category":null,"monthly_downloads":0,"funding_links":[],"readme_doi_urls":[],"works":{},"citation_counts":{},"total_citations":0,"keywords_from_contributors":["computational-linguistics","language-modelling","lm"],"project_url":"https://science.ecosyste.ms/api/v1/projects/5621","html_url":"https://science.ecosyste.ms/projects/5621"}