Skip to content

Commit 46f1d1c

Browse files
committed
License denotation
1 parent 392c56f commit 46f1d1c

Some content is hidden

Large commits have some content hidden by default. Use the search box below to find content that may be hidden.

65 files changed

+956
-212
lines changed

.gitignore

+1-1
Original file line number | Diff line number | Diff line change
@@ -10,7 +10,7 @@ data/data_list/sample_list.csv
1010
docs/training
1111
docs/training/*
1212
__pycache__/
13-
13+
venv/*
1414
*.pyc
1515
.idea
1616
.ipynb_checkpoints

bin/eval.py

+13-5
Original file line number | Diff line number | Diff line change
@@ -1,8 +1,16 @@
1-
# -*- coding: utf-8 -*-
2-
# Soohwan Kim, Seyoung Bae, Cheolhwang Won.
3-
# @ArXiv : KoSpeech: Open-Source Toolkit for End-to-End Korean Speech Recognition
4-
# This source code is licensed under the Apache 2.0 License license found in the
5-
# LICENSE file in the root directory of this source tree.
1+
# Copyright (c) 2020, Soohwan Kim. All rights reserved.
2+
#
3+
# Licensed under the Apache License, Version 2.0 (the "License");
4+
# you may not use this file except in compliance with the License.
5+
# You may obtain a copy of the License at
6+
#
7+
# http://www.apache.org/licenses/LICENSE-2.0
8+
#
9+
# Unless required by applicable law or agreed to in writing, software
10+
# distributed under the License is distributed on an "AS IS" BASIS,
11+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12+
# See the License for the specific language governing permissions and
13+
# limitations under the License.
614

715
import os
816
import sys

bin/inference.py

+14
Original file line number | Diff line number | Diff line change
@@ -1,3 +1,17 @@
1+
# Copyright (c) 2020, Soohwan Kim. All rights reserved.
2+
#
3+
# Licensed under the Apache License, Version 2.0 (the "License");
4+
# you may not use this file except in compliance with the License.
5+
# You may obtain a copy of the License at
6+
#
7+
# http://www.apache.org/licenses/LICENSE-2.0
8+
#
9+
# Unless required by applicable law or agreed to in writing, software
10+
# distributed under the License is distributed on an "AS IS" BASIS,
11+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12+
# See the License for the specific language governing permissions and
13+
# limitations under the License.
14+
115
import argparse
216
import torch
317
import torch.nn as nn

bin/main.py

+13-5
Original file line number | Diff line number | Diff line change
@@ -1,8 +1,16 @@
1-
# -*- coding: utf-8 -*-
2-
# Soohwan Kim, Seyoung Bae, Cheolhwang Won.
3-
# @ArXiv : KoSpeech: Open-Source Toolkit for End-to-End Korean Speech Recognition
4-
# This source code is licensed under the Apache 2.0 License license found in the
5-
# LICENSE file in the root directory of this source tree.
1+
# Copyright (c) 2020, Soohwan Kim. All rights reserved.
2+
#
3+
# Licensed under the Apache License, Version 2.0 (the "License");
4+
# you may not use this file except in compliance with the License.
5+
# You may obtain a copy of the License at
6+
#
7+
# http://www.apache.org/licenses/LICENSE-2.0
8+
#
9+
# Unless required by applicable law or agreed to in writing, software
10+
# distributed under the License is distributed on an "AS IS" BASIS,
11+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12+
# See the License for the specific language governing permissions and
13+
# limitations under the License.
614

715
import os
816
import random

dataset/kspon/main.py

+14
Original file line number | Diff line number | Diff line change
@@ -1,3 +1,17 @@
1+
# Copyright (c) 2020, Soohwan Kim. All rights reserved.
2+
#
3+
# Licensed under the Apache License, Version 2.0 (the "License");
4+
# you may not use this file except in compliance with the License.
5+
# You may obtain a copy of the License at
6+
#
7+
# http://www.apache.org/licenses/LICENSE-2.0
8+
#
9+
# Unless required by applicable law or agreed to in writing, software
10+
# distributed under the License is distributed on an "AS IS" BASIS,
11+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12+
# See the License for the specific language governing permissions and
13+
# limitations under the License.
14+
115
import argparse
216
from preprocess.grapheme import sentence_to_grapheme
317
from preprocess.preprocess import preprocess

dataset/kspon/preprocess/character.py

+14
Original file line number | Diff line number | Diff line change
@@ -1,3 +1,17 @@
1+
# Copyright (c) 2020, Soohwan Kim. All rights reserved.
2+
#
3+
# Licensed under the Apache License, Version 2.0 (the "License");
4+
# you may not use this file except in compliance with the License.
5+
# You may obtain a copy of the License at
6+
#
7+
# http://www.apache.org/licenses/LICENSE-2.0
8+
#
9+
# Unless required by applicable law or agreed to in writing, software
10+
# distributed under the License is distributed on an "AS IS" BASIS,
11+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12+
# See the License for the specific language governing permissions and
13+
# limitations under the License.
14+
115
import os
216
import pandas as pd
317

dataset/kspon/preprocess/grapheme.py

+14
Original file line number | Diff line number | Diff line change
@@ -1,3 +1,17 @@
1+
# Copyright (c) 2020, Soohwan Kim. All rights reserved.
2+
#
3+
# Licensed under the Apache License, Version 2.0 (the "License");
4+
# you may not use this file except in compliance with the License.
5+
# You may obtain a copy of the License at
6+
#
7+
# http://www.apache.org/licenses/LICENSE-2.0
8+
#
9+
# Unless required by applicable law or agreed to in writing, software
10+
# distributed under the License is distributed on an "AS IS" BASIS,
11+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12+
# See the License for the specific language governing permissions and
13+
# limitations under the License.
14+
115
import os
216
import pandas as pd
317
import unicodedata

dataset/kspon/preprocess/preprocess.py

+14
Original file line number | Diff line number | Diff line change
@@ -1,3 +1,17 @@
1+
# Copyright (c) 2020, Soohwan Kim. All rights reserved.
2+
#
3+
# Licensed under the Apache License, Version 2.0 (the "License");
4+
# you may not use this file except in compliance with the License.
5+
# You may obtain a copy of the License at
6+
#
7+
# http://www.apache.org/licenses/LICENSE-2.0
8+
#
9+
# Unless required by applicable law or agreed to in writing, software
10+
# distributed under the License is distributed on an "AS IS" BASIS,
11+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12+
# See the License for the specific language governing permissions and
13+
# limitations under the License.
14+
115
import os
216
import re
317

dataset/kspon/preprocess/subword.py

+14
Original file line number | Diff line number | Diff line change
@@ -1,3 +1,17 @@
1+
# Copyright (c) 2020, Soohwan Kim. All rights reserved.
2+
#
3+
# Licensed under the Apache License, Version 2.0 (the "License");
4+
# you may not use this file except in compliance with the License.
5+
# You may obtain a copy of the License at
6+
#
7+
# http://www.apache.org/licenses/LICENSE-2.0
8+
#
9+
# Unless required by applicable law or agreed to in writing, software
10+
# distributed under the License is distributed on an "AS IS" BASIS,
11+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12+
# See the License for the specific language governing permissions and
13+
# limitations under the License.
14+
115
import os
216
import sentencepiece as spm
317

dataset/libri/prepare-libri.py

+14
Original file line number | Diff line number | Diff line change
@@ -1,3 +1,17 @@
1+
# Copyright (c) 2020, Soohwan Kim. All rights reserved.
2+
#
3+
# Licensed under the Apache License, Version 2.0 (the "License");
4+
# you may not use this file except in compliance with the License.
5+
# You may obtain a copy of the License at
6+
#
7+
# http://www.apache.org/licenses/LICENSE-2.0
8+
#
9+
# Unless required by applicable law or agreed to in writing, software
10+
# distributed under the License is distributed on an "AS IS" BASIS,
11+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12+
# See the License for the specific language governing permissions and
13+
# limitations under the License.
14+
115
import argparse
216
from preprocess import (
317
collect_transcripts,

dataset/libri/preprocess.py

+14
Original file line numberDiff line numberDiff line change
@@ -1,3 +1,17 @@
1+
# Copyright (c) 2020, Soohwan Kim. All rights reserved.
2+
#
3+
# Licensed under the Apache License, Version 2.0 (the "License");
4+
# you may not use this file except in compliance with the License.
5+
# You may obtain a copy of the License at
6+
#
7+
# http://www.apache.org/licenses/LICENSE-2.0
8+
#
9+
# Unless required by applicable law or agreed to in writing, software
10+
# distributed under the License is distributed on an "AS IS" BASIS,
11+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12+
# See the License for the specific language governing permissions and
13+
# limitations under the License.
14+
115
import os
216
import sentencepiece as spm
317

kospeech/checkpoint/__init__.py

+14
Original file line number | Diff line number | Diff line change
@@ -1 +1,15 @@
1+
# Copyright (c) 2020, Soohwan Kim. All rights reserved.
2+
#
3+
# Licensed under the Apache License, Version 2.0 (the "License");
4+
# you may not use this file except in compliance with the License.
5+
# You may obtain a copy of the License at
6+
#
7+
# http://www.apache.org/licenses/LICENSE-2.0
8+
#
9+
# Unless required by applicable law or agreed to in writing, software
10+
# distributed under the License is distributed on an "AS IS" BASIS,
11+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12+
# See the License for the specific language governing permissions and
13+
# limitations under the License.
14+
115
from kospeech.checkpoint.checkpoint import Checkpoint

kospeech/checkpoint/checkpoint.py

+13-5
Original file line number | Diff line number | Diff line change
@@ -1,8 +1,16 @@
1-
# -*- coding: utf-8 -*-
2-
# Soohwan Kim, Seyoung Bae, Cheolhwang Won.
3-
# @ArXiv : KoSpeech: Open-Source Toolkit for End-to-End Korean Speech Recognition
4-
# This source code is licensed under the Apache 2.0 License license found in the
5-
# LICENSE file in the root directory of this source tree.
1+
# Copyright (c) 2020, Soohwan Kim. All rights reserved.
2+
#
3+
# Licensed under the Apache License, Version 2.0 (the "License");
4+
# you may not use this file except in compliance with the License.
5+
# You may obtain a copy of the License at
6+
#
7+
# http://www.apache.org/licenses/LICENSE-2.0
8+
#
9+
# Unless required by applicable law or agreed to in writing, software
10+
# distributed under the License is distributed on an "AS IS" BASIS,
11+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12+
# See the License for the specific language governing permissions and
13+
# limitations under the License.
614

715
import os
816
import time

kospeech/criterion/__init__.py

+14
Original file line number | Diff line number | Diff line change
@@ -1,2 +1,16 @@
1+
# Copyright (c) 2020, Soohwan Kim. All rights reserved.
2+
#
3+
# Licensed under the Apache License, Version 2.0 (the "License");
4+
# you may not use this file except in compliance with the License.
5+
# You may obtain a copy of the License at
6+
#
7+
# http://www.apache.org/licenses/LICENSE-2.0
8+
#
9+
# Unless required by applicable law or agreed to in writing, software
10+
# distributed under the License is distributed on an "AS IS" BASIS,
11+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12+
# See the License for the specific language governing permissions and
13+
# limitations under the License.
14+
115
from kospeech.criterion.label_smoothed_cross_entropy import LabelSmoothedCrossEntropyLoss
216
from kospeech.criterion.joint_ctc_cross_entropy import JointCTCCrossEntropyLoss

kospeech/criterion/joint_ctc_cross_entropy.py

+13-5
Original file line number | Diff line number | Diff line change
@@ -1,8 +1,16 @@
1-
# -*- coding: utf-8 -*-
2-
# Soohwan Kim, Seyoung Bae, Cheolhwang Won.
3-
# @ArXiv : KoSpeech: Open-Source Toolkit for End-to-End Korean Speech Recognition
4-
# This source code is licensed under the Apache 2.0 License license found in the
5-
# LICENSE file in the root directory of this source tree.
1+
# Copyright (c) 2020, Soohwan Kim. All rights reserved.
2+
#
3+
# Licensed under the Apache License, Version 2.0 (the "License");
4+
# you may not use this file except in compliance with the License.
5+
# You may obtain a copy of the License at
6+
#
7+
# http://www.apache.org/licenses/LICENSE-2.0
8+
#
9+
# Unless required by applicable law or agreed to in writing, software
10+
# distributed under the License is distributed on an "AS IS" BASIS,
11+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12+
# See the License for the specific language governing permissions and
13+
# limitations under the License.
614

715
import torch.nn as nn
816

kospeech/criterion/label_smoothed_cross_entropy.py

+13-5
Original file line number | Diff line number | Diff line change
@@ -1,8 +1,16 @@
1-
# -*- coding: utf-8 -*-
2-
# Soohwan Kim, Seyoung Bae, Cheolhwang Won.
3-
# @ArXiv : KoSpeech: Open-Source Toolkit for End-to-End Korean Speech Recognition
4-
# This source code is licensed under the Apache 2.0 License license found in the
5-
# LICENSE file in the root directory of this source tree.
1+
# Copyright (c) 2020, Soohwan Kim. All rights reserved.
2+
#
3+
# Licensed under the Apache License, Version 2.0 (the "License");
4+
# you may not use this file except in compliance with the License.
5+
# You may obtain a copy of the License at
6+
#
7+
# http://www.apache.org/licenses/LICENSE-2.0
8+
#
9+
# Unless required by applicable law or agreed to in writing, software
10+
# distributed under the License is distributed on an "AS IS" BASIS,
11+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12+
# See the License for the specific language governing permissions and
13+
# limitations under the License.
614

715
import torch
816
import torch.nn as nn

kospeech/data/__init__.py

+14
Original file line number | Diff line number | Diff line change
@@ -1,3 +1,17 @@
1+
# Copyright (c) 2020, Soohwan Kim. All rights reserved.
2+
#
3+
# Licensed under the Apache License, Version 2.0 (the "License");
4+
# you may not use this file except in compliance with the License.
5+
# You may obtain a copy of the License at
6+
#
7+
# http://www.apache.org/licenses/LICENSE-2.0
8+
#
9+
# Unless required by applicable law or agreed to in writing, software
10+
# distributed under the License is distributed on an "AS IS" BASIS,
11+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12+
# See the License for the specific language governing permissions and
13+
# limitations under the License.
14+
115
from kospeech.data.audio.parser import SpectrogramParser
216
from kospeech.data.label_loader import load_dataset
317
from kospeech.data.data_loader import (

kospeech/data/audio/__init__.py

+13-4
Original file line number | Diff line number | Diff line change
@@ -1,7 +1,16 @@
1-
# Soohwan Kim, Seyoung Bae, Cheolhwang Won.
2-
# @ArXiv : KoSpeech: Open-Source Toolkit for End-to-End Korean Speech Recognition
3-
# This source code is licensed under the Apache 2.0 License license found in the
4-
# LICENSE file in the root directory of this source tree.
1+
# Copyright (c) 2020, Soohwan Kim. All rights reserved.
2+
#
3+
# Licensed under the Apache License, Version 2.0 (the "License");
4+
# you may not use this file except in compliance with the License.
5+
# You may obtain a copy of the License at
6+
#
7+
# http://www.apache.org/licenses/LICENSE-2.0
8+
#
9+
# Unless required by applicable law or agreed to in writing, software
10+
# distributed under the License is distributed on an "AS IS" BASIS,
11+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12+
# See the License for the specific language governing permissions and
13+
# limitations under the License.
514

615
from dataclasses import dataclass
716

kospeech/data/audio/augment.py

+13-5
Original file line number | Diff line number | Diff line change
@@ -1,8 +1,16 @@
1-
# -*- coding: utf-8 -*-
2-
# Soohwan Kim, Seyoung Bae, Cheolhwang Won.
3-
# @ArXiv : KoSpeech: Open-Source Toolkit for End-to-End Korean Speech Recognition
4-
# This source code is licensed under the Apache 2.0 License license found in the
5-
# LICENSE file in the root directory of this source tree.
1+
# Copyright (c) 2020, Soohwan Kim. All rights reserved.
2+
#
3+
# Licensed under the Apache License, Version 2.0 (the "License");
4+
# you may not use this file except in compliance with the License.
5+
# You may obtain a copy of the License at
6+
#
7+
# http://www.apache.org/licenses/LICENSE-2.0
8+
#
9+
# Unless required by applicable law or agreed to in writing, software
10+
# distributed under the License is distributed on an "AS IS" BASIS,
11+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12+
# See the License for the specific language governing permissions and
13+
# limitations under the License.
614

715
import os
816
import random

kospeech/data/audio/core.py

+13-5
Original file line number | Diff line number | Diff line change
@@ -1,8 +1,16 @@
1-
# -*- coding: utf-8 -*-
2-
# Soohwan Kim, Seyoung Bae, Cheolhwang Won.
3-
# @ArXiv : KoSpeech: Open-Source Toolkit for End-to-End Korean Speech Recognition
4-
# This source code is licensed under the Apache 2.0 License license found in the
5-
# LICENSE file in the root directory of this source tree.
1+
# Copyright (c) 2020, Soohwan Kim. All rights reserved.
2+
#
3+
# Licensed under the Apache License, Version 2.0 (the "License");
4+
# you may not use this file except in compliance with the License.
5+
# You may obtain a copy of the License at
6+
#
7+
# http://www.apache.org/licenses/LICENSE-2.0
8+
#
9+
# Unless required by applicable law or agreed to in writing, software
10+
# distributed under the License is distributed on an "AS IS" BASIS,
11+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12+
# See the License for the specific language governing permissions and
13+
# limitations under the License.
614

715
import warnings
816
import numpy as np

0 commit comments

Comments
 (0)