{"payload":{"pageCount":1,"repositories":[{"type":"Public","name":"IMS-Toucan","owner":"DigitalPhonetics","isFork":false,"description":"Multilingual and Controllable Text-to-Speech Toolkit of the Speech and Language Technologies Group at the University of Stuttgart.","allTopics":["text-to-speech","deep-learning","toolkit","speech","pytorch","tts","speech-synthesis","speech-processing"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":1,"starsCount":471,"forksCount":85,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-06-11T11:39:19.020Z"}},{"type":"Public","name":"Intrinsic-Subgraph-Generation-for-VQA","owner":"DigitalPhonetics","isFork":false,"description":"","allTopics":["interpretability","explainable-ai","graph-neural-networks","interpreatable-ai","subgraph-extraction","graph-based-vqa"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":5,"forksCount":0,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-20T12:42:42.465Z"}},{"type":"Public","name":"VoicePAT","owner":"DigitalPhonetics","isFork":false,"description":"VoicePAT is a modular and efficient toolkit for voice privacy research, with main focus on speaker anonymization.","allTopics":[],"primaryLanguage":{"name":"Shell","color":"#89e051"},"pullRequestCount":0,"issueCount":2,"starsCount":44,"forksCount":4,"license":"Apache License 2.0","participation":[0,0,0,0,0,0,0,0,0,0,0,0,2,2,0,0,2,0,0,0,0,0,2,7,3,0,23,19,0,0,4,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-14T12:33:23.380Z"}},{"type":"Public","name":"bloomzmms","owner":"DigitalPhonetics","isFork":false,"description":"Materials for the publication \"Teaching a Multilingual Large Language Model to Understand Multilingual Speech via Multi-Instructional Training\"","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":0,"forksCount":0,"license":null,"participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,3,0,4,0,0,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-04-16T21:21:05.216Z"}},{"type":"Public","name":"conversational-tree-search","owner":"DigitalPhonetics","isFork":false,"description":"Code and Data for Conversational Tree Search: A new task that bridges the gap between FAQ-style information retrieval and task-oriented dialog.","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":5,"forksCount":0,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-03-22T14:13:02.530Z"}},{"type":"Public","name":"speaker-anonymization","owner":"DigitalPhonetics","isFork":false,"description":"Speaker anonymization pipeline for hiding the identity of the speaker of a recording by changing the voice in it.","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":2,"starsCount":44,"forksCount":4,"license":"GNU General Public License v3.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-03-14T14:11:42.565Z"}},{"type":"Public","name":"hard-negative-captions","owner":"DigitalPhonetics","isFork":false,"description":"","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":4,"forksCount":0,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-02-23T13:58:12.901Z"}},{"type":"Public","name":"diagraph","owner":"DigitalPhonetics","isFork":false,"description":"DIAGRAPH: An open-source graphic interface for dialog flow design","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":2,"forksCount":0,"license":"GNU General Public License v3.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-10-23T09:51:40.652Z"}},{"type":"Public","name":"multilingual-seq2seq-slu","owner":"DigitalPhonetics","isFork":false,"description":"Materials for the publication \"Leveraging Multilingual Self-Supervised Pretrained Models for Sequence-to-Sequence End-to-End Spoken Language Understanding\"","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":2,"forksCount":0,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-10-11T10:47:51.906Z"}},{"type":"Public","name":"adviser","owner":"DigitalPhonetics","isFork":false,"description":"ADvISER is a flexible framework to encourage task-oriented dialog system research & development ","allTopics":["machine-learning","framework","reinforcement-learning","toolkit","dialogue","dialogue-systems","task-oriented-dialogue","multimodal"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":8,"issueCount":3,"starsCount":55,"forksCount":32,"license":"GNU General Public License v3.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-08-14T22:44:14.565Z"}},{"type":"Public","name":"BetterFinetuning","owner":"DigitalPhonetics","isFork":false,"description":"Code accompanying our paper on finetuning self-supervised general speech representations with a combination of contrastive and non-contrastive methods.","allTopics":["speech-embedding","self-supervised-learning"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":1,"starsCount":1,"forksCount":0,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2022-10-05T23:26:20.593Z"}},{"type":"Public","name":"IMS-Speech","owner":"DigitalPhonetics","isFork":false,"description":"IMS-Speech is a tool for German, English and Russian speech transcription aiming to facilitate research in various disciplines. We are willing to provide a speech transcription service with an intuitive web interface accessible with a wide range of computing devices and to people with various backgrounds. Our service is available here: https://7…","allTopics":[],"primaryLanguage":{"name":"Go","color":"#00ADD8"},"pullRequestCount":0,"issueCount":1,"starsCount":5,"forksCount":2,"license":"MIT License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2022-05-13T10:33:42.951Z"}},{"type":"Public","name":"Our_Fault","owner":"DigitalPhonetics","isFork":false,"description":"A collaborative dialog game playable by a human and an AI system, designed to better understand how users view such an AI partner. The repository contains code for the game as well as dialog logs, survey responses, and annotations from a user study conducted with this scenario.","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":0,"forksCount":0,"license":"GNU General Public License v3.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2021-11-10T08:47:43.137Z"}},{"type":"Public","name":"ethics_in_chatbot_design","owner":"DigitalPhonetics","isFork":false,"description":"A project exploring ethical implications of chatbot design, in particular affective language style. The repository contains code, survey responses, and annotated data for the experiment conducted using this implementation.","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":0,"forksCount":0,"license":"GNU General Public License v3.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2021-11-09T12:31:48.309Z"}},{"type":"Public","name":"cyclegan-emotion-transfer","owner":"DigitalPhonetics","isFork":false,"description":"CycleGAN-based Emotion Style Transfer as Data Augmentation for Speech Emotion Recognition","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":1,"starsCount":11,"forksCount":1,"license":"GNU General Public License v3.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2019-10-07T08:42:31.426Z"}},{"type":"Public","name":"nlg-eval","owner":"DigitalPhonetics","isFork":false,"description":"Code accompanying the INLG 2018 paper Sequence-to-Sequence Models for Data-to-Text Natural Language Generation: Word- vs. Character-based Processing and Output Diversity","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":6,"forksCount":0,"license":"GNU General Public License v3.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2019-08-30T07:07:02.583Z"}},{"type":"Public","name":"reading-comprehension","owner":"DigitalPhonetics","isFork":false,"description":"Comparing attention-based convolutional and recurrent neural networks under adversarial attacks to investigate their success and limitations in machine reading comprehension","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":10,"forksCount":3,"license":"GNU General Public License v3.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2018-08-24T13:29:57.362Z"}}],"repositoryCount":17,"userInfo":null,"searchable":true,"definitions":[],"typeFilters":[{"id":"all","text":"All"},{"id":"public","text":"Public"},{"id":"source","text":"Sources"},{"id":"fork","text":"Forks"},{"id":"archived","text":"Archived"},{"id":"template","text":"Templates"}],"compactMode":false},"title":"Repositories"}