{"payload":{"pageCount":2,"repositories":[{"type":"Public","name":"demint","owner":"transducens","isFork":false,"description":"Repository for the project \"DeMINT: Automated Language Debriefing for English Learners via AI Chatbot Analysis of Meeting Transcripts\"","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":5,"starsCount":3,"forksCount":0,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-08-09T13:17:25.501Z"}},{"type":"Public","name":"transducens-website","owner":"transducens","isFork":false,"description":"Markdown and static files for the Transducens research group's website.","allTopics":[],"primaryLanguage":{"name":"HTML","color":"#e34c26"},"pullRequestCount":0,"issueCount":0,"starsCount":0,"forksCount":0,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-07-30T10:04:56.788Z"}},{"type":"Public","name":"PILAR","owner":"transducens","isFork":false,"description":"","allTopics":[],"primaryLanguage":null,"pullRequestCount":0,"issueCount":0,"starsCount":3,"forksCount":0,"license":"Creative Commons Zero v1.0 Universal","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-07-29T11:16:19.260Z"}},{"type":"Public","name":"wmt2024-romance-tests","owner":"transducens","isFork":false,"description":"Repository containing the test files for the WMT24 Shared Task: Translation into Low-Resource Languages of Spain","allTopics":[],"primaryLanguage":null,"pullRequestCount":0,"issueCount":0,"starsCount":0,"forksCount":0,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-07-23T06:26:30.784Z"}},{"type":"Public","name":"mayanv","owner":"transducens","isFork":false,"description":"Hosts a number of bilingual Mayan-Spanish corpora","allTopics":[],"primaryLanguage":{"name":"JavaScript","color":"#f1e05a"},"pullRequestCount":0,"issueCount":0,"starsCount":3,"forksCount":1,"license":"Creative Commons Zero v1.0 Universal","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-06-16T14:59:42.532Z"}},{"type":"Public","name":"compiladores","owner":"transducens","isFork":false,"description":"Código fuente del libro \"Diseño de compiladores\"","allTopics":[],"primaryLanguage":{"name":"TeX","color":"#3D6117"},"pullRequestCount":0,"issueCount":0,"starsCount":1,"forksCount":0,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-04-29T14:17:48.996Z"}},{"type":"Public","name":"idiomata_cognitor","owner":"transducens","isFork":false,"description":"Language identifier for Romance languages","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":0,"forksCount":1,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-04-25T09:27:45.201Z"}},{"type":"Public","name":"nmt-maya","owner":"transducens","isFork":false,"description":"Hosts code to train bilingual and multilingual NMT models of Mayan languages","allTopics":[],"primaryLanguage":{"name":"JavaScript","color":"#f1e05a"},"pullRequestCount":0,"issueCount":0,"starsCount":0,"forksCount":0,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-03-22T11:49:31.633Z"}},{"type":"Public","name":"parallel-urls-classifier","owner":"transducens","isFork":false,"description":"Parallel URLs Classifier (PUC) infers the parallelness of a pair of documents from their URLs","allTopics":["url","crawling","document-aligner"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":0,"forksCount":1,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-03-18T18:03:05.355Z"}},{"type":"Public","name":"url2lang","owner":"transducens","isFork":false,"description":"url2lang infers the language of a document from its URL","allTopics":["url","crawling","language-identification"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":0,"forksCount":1,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-03-15T13:49:48.116Z"}},{"type":"Public","name":"linguacrawl","owner":"transducens","isFork":false,"description":"Crawling engine that crawls a set of top-level domains looking for documents in a list of languages","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":3,"issueCount":2,"starsCount":11,"forksCount":3,"license":"GNU General Public License v3.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-02-06T17:12:18.092Z"}},{"type":"Public","name":"jw_crawler","owner":"transducens","isFork":false,"description":"","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":0,"forksCount":0,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-01-11T13:11:09.725Z"}},{"type":"Public","name":"MaTiLDA","owner":"transducens","isFork":false,"description":"","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":0,"forksCount":0,"license":"GNU General Public License v3.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-11-28T15:13:07.739Z"}},{"type":"Public","name":"mtl-da-emnlp","owner":"transducens","isFork":false,"description":"Code to reproduce the experiments presented in the EMNLP 2021 paper \"Rethinking data augmentation for low-resource neural machine translation: a multi-task learning approach\"","allTopics":[],"primaryLanguage":{"name":"Shell","color":"#89e051"},"pullRequestCount":0,"issueCount":1,"starsCount":5,"forksCount":2,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-11-28T10:47:36.533Z"}},{"type":"Public","name":"trad-automatica-neuronal-valenciano","owner":"transducens","isFork":false,"description":"","allTopics":[],"primaryLanguage":{"name":"JavaScript","color":"#f1e05a"},"pullRequestCount":0,"issueCount":0,"starsCount":0,"forksCount":0,"license":"GNU General Public License v3.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-11-24T12:19:27.309Z"}},{"type":"Public","name":"CrossLingualNeuralFMS","owner":"transducens","isFork":false,"description":"Code to reproduce the experiments reported in the paper \"Cross-lingual neural fuzzy matching for exploiting target-language monolingual corpora in computer-aided translation\" published in EMNLP 2022","allTopics":[],"primaryLanguage":{"name":"Java","color":"#b07219"},"pullRequestCount":0,"issueCount":0,"starsCount":1,"forksCount":0,"license":"GNU General Public License v3.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2022-12-09T15:54:11.757Z"}},{"type":"Public","name":"tune-n-distill","owner":"transducens","isFork":false,"description":"Exploiting large pre-trained models for low-resource neural machine translation","allTopics":[],"primaryLanguage":{"name":"Shell","color":"#89e051"},"pullRequestCount":0,"issueCount":0,"starsCount":0,"forksCount":0,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2022-06-30T12:07:09.798Z"}},{"type":"Public","name":"biwords","owner":"transducens","isFork":false,"description":"Processing of word alignments for compressing parallel corpora","allTopics":[],"primaryLanguage":{"name":"C++","color":"#f34b7d"},"pullRequestCount":0,"issueCount":0,"starsCount":0,"forksCount":0,"license":"GNU General Public License v2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2021-10-21T14:33:49.779Z"}},{"type":"Public","name":"bitext2bilexicon","owner":"transducens","isFork":false,"description":"Tool that allows to build a bilingual lexicon from a parallel corpus","allTopics":[],"primaryLanguage":{"name":"Shell","color":"#89e051"},"pullRequestCount":0,"issueCount":0,"starsCount":0,"forksCount":0,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2021-08-31T09:58:27.102Z"}},{"type":"Public","name":"python-Levenshtein","owner":"transducens","isFork":true,"description":"The Levenshtein Python C extension module contains functions for fast computation of Levenshtein distance and string similarity","allTopics":[],"primaryLanguage":{"name":"C","color":"#555555"},"pullRequestCount":0,"issueCount":0,"starsCount":0,"forksCount":229,"license":"GNU General Public License v2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2021-08-11T16:38:39.016Z"}},{"type":"Public","name":"bayeseq","owner":"transducens","isFork":true,"description":"Auto-encoding variational Bayesian inference for sequence generation models.","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":0,"forksCount":10,"license":"MIT License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2021-01-20T11:54:38.828Z"}},{"type":"Public","name":"smart-segmentation","owner":"transducens","isFork":false,"description":"","allTopics":[],"primaryLanguage":{"name":"Shell","color":"#89e051"},"pullRequestCount":0,"issueCount":0,"starsCount":2,"forksCount":0,"license":"GNU General Public License v3.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2020-10-12T20:59:21.214Z"}},{"type":"Public","name":"OmegaT-FuzzyMatchRepair-Plugin","owner":"transducens","isFork":false,"description":"","allTopics":[],"primaryLanguage":{"name":"Java","color":"#b07219"},"pullRequestCount":0,"issueCount":1,"starsCount":0,"forksCount":2,"license":"GNU General Public License v3.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2020-05-04T08:44:18.102Z"}},{"type":"Public","name":"gourmet-ua","owner":"transducens","isFork":false,"description":"Developments of UA for the EU project GoURMET","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":1,"forksCount":1,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2020-02-03T16:05:03.419Z"}},{"type":"Public","name":"JSONL2bitextor","owner":"transducens","isFork":false,"description":"Script and instructions to produce a Bitextor-compatible parallel-data-extraction task from JSONL files as provided by BBC","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":1,"forksCount":0,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2019-12-20T10:52:43.828Z"}},{"type":"Public","name":"LASERtrain","owner":"transducens","isFork":false,"description":"","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":2,"starsCount":22,"forksCount":5,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2019-12-20T10:51:33.688Z"}},{"type":"Public","name":"LASER","owner":"transducens","isFork":true,"description":"Language-Agnostic SEntence Representations","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":0,"forksCount":459,"license":"Other","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2019-06-26T15:03:28.024Z"}},{"type":"Public","name":"Forecat-OmegaT","owner":"transducens","isFork":false,"description":"Plugin that adds the functionality of Forecat (https://github.com/jaspock/forecat) to OmegaT.","allTopics":[],"primaryLanguage":{"name":"Java","color":"#b07219"},"pullRequestCount":0,"issueCount":7,"starsCount":8,"forksCount":0,"license":"GNU General Public License v3.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2018-06-12T17:17:34.579Z"}},{"type":"Public","name":"forecat","owner":"transducens","isFork":false,"description":"","allTopics":[],"primaryLanguage":{"name":"Java","color":"#b07219"},"pullRequestCount":0,"issueCount":0,"starsCount":8,"forksCount":1,"license":"GNU Affero General Public License v3.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2017-08-22T12:05:04.135Z"}},{"type":"Public","name":"cachetrans-omegat","owner":"transducens","isFork":false,"description":"Dumb translation engine that pulls translations from a text file.","allTopics":[],"primaryLanguage":{"name":"Java","color":"#b07219"},"pullRequestCount":0,"issueCount":0,"starsCount":1,"forksCount":0,"license":"GNU General Public License v3.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2017-07-10T15:23:04.594Z"}}],"repositoryCount":39,"userInfo":null,"searchable":true,"definitions":[],"typeFilters":[{"id":"all","text":"All"},{"id":"public","text":"Public"},{"id":"source","text":"Sources"},{"id":"fork","text":"Forks"},{"id":"archived","text":"Archived"},{"id":"template","text":"Templates"}],"compactMode":false},"title":"transducens repositories"}