Wanlau committed on
Commit
24ee3f3
·
1 Parent(s): 85b8be3
Ako_v2/Ako_v2.pth DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:a988c72eef59b4dbc91da37eb4d59ef60de66cc892734abbdb0fb549ff33ae40
3
- size 55222767
 
 
 
 
Ako_v2/added_IVF256_Flat_nprobe_1_Ako_v2_v2.index DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:d0b2ff679c63a0d24eb6c52ecd0acc71e1cea5afff7ce948428358ae1e214754
3
- size 31588619
 
 
 
 
Ako_v2/config.json DELETED
@@ -1,79 +0,0 @@
1
- {
2
- "data": {
3
- "filter_length": 2048,
4
- "hop_length": 400,
5
- "max_wav_value": 32768.0,
6
- "mel_fmax": null,
7
- "mel_fmin": 0.0,
8
- "n_mel_channels": 125,
9
- "sampling_rate": 40000,
10
- "win_length": 2048
11
- },
12
- "model": {
13
- "filter_channels": 768,
14
- "gin_channels": 256,
15
- "hidden_channels": 192,
16
- "inter_channels": 192,
17
- "kernel_size": 3,
18
- "n_heads": 2,
19
- "n_layers": 6,
20
- "p_dropout": 0,
21
- "resblock": "1",
22
- "resblock_dilation_sizes": [
23
- [
24
- 1,
25
- 3,
26
- 5
27
- ],
28
- [
29
- 1,
30
- 3,
31
- 5
32
- ],
33
- [
34
- 1,
35
- 3,
36
- 5
37
- ]
38
- ],
39
- "resblock_kernel_sizes": [
40
- 3,
41
- 7,
42
- 11
43
- ],
44
- "spk_embed_dim": 109,
45
- "upsample_initial_channel": 512,
46
- "upsample_kernel_sizes": [
47
- 16,
48
- 16,
49
- 4,
50
- 4
51
- ],
52
- "upsample_rates": [
53
- 10,
54
- 10,
55
- 2,
56
- 2
57
- ],
58
- "use_spectral_norm": false
59
- },
60
- "train": {
61
- "batch_size": 4,
62
- "betas": [
63
- 0.8,
64
- 0.99
65
- ],
66
- "c_kl": 1.0,
67
- "c_mel": 45,
68
- "epochs": 20000,
69
- "eps": 1e-09,
70
- "fp16_run": true,
71
- "init_lr_ratio": 1,
72
- "learning_rate": 0.0001,
73
- "log_interval": 200,
74
- "lr_decay": 0.999875,
75
- "seed": 1234,
76
- "segment_size": 12800,
77
- "warmup_epochs": 0
78
- }
79
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
Eve_v2/Eve_v2.pth DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:ef6a27cd4c4b51711a9285ef086d768fde25e6f7cf8cce6e6c4f8f971800aabf
3
- size 55222767
 
 
 
 
Eve_v2/added_IVF256_Flat_nprobe_1_Eve_v2_v2.index DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:708b2c8a92e08ed8cfbbd2aabbe0f07d1c82135ca9e6b26790175bcf06b8c64a
3
- size 31588619
 
 
 
 
Eve_v2/config.json DELETED
@@ -1,79 +0,0 @@
1
- {
2
- "data": {
3
- "filter_length": 2048,
4
- "hop_length": 400,
5
- "max_wav_value": 32768.0,
6
- "mel_fmax": null,
7
- "mel_fmin": 0.0,
8
- "n_mel_channels": 125,
9
- "sampling_rate": 40000,
10
- "win_length": 2048
11
- },
12
- "model": {
13
- "filter_channels": 768,
14
- "gin_channels": 256,
15
- "hidden_channels": 192,
16
- "inter_channels": 192,
17
- "kernel_size": 3,
18
- "n_heads": 2,
19
- "n_layers": 6,
20
- "p_dropout": 0,
21
- "resblock": "1",
22
- "resblock_dilation_sizes": [
23
- [
24
- 1,
25
- 3,
26
- 5
27
- ],
28
- [
29
- 1,
30
- 3,
31
- 5
32
- ],
33
- [
34
- 1,
35
- 3,
36
- 5
37
- ]
38
- ],
39
- "resblock_kernel_sizes": [
40
- 3,
41
- 7,
42
- 11
43
- ],
44
- "spk_embed_dim": 109,
45
- "upsample_initial_channel": 512,
46
- "upsample_kernel_sizes": [
47
- 16,
48
- 16,
49
- 4,
50
- 4
51
- ],
52
- "upsample_rates": [
53
- 10,
54
- 10,
55
- 2,
56
- 2
57
- ],
58
- "use_spectral_norm": false
59
- },
60
- "train": {
61
- "batch_size": 4,
62
- "betas": [
63
- 0.8,
64
- 0.99
65
- ],
66
- "c_kl": 1.0,
67
- "c_mel": 45,
68
- "epochs": 20000,
69
- "eps": 1e-09,
70
- "fp16_run": true,
71
- "init_lr_ratio": 1,
72
- "learning_rate": 0.0001,
73
- "log_interval": 200,
74
- "lr_decay": 0.999875,
75
- "seed": 1234,
76
- "segment_size": 12800,
77
- "warmup_epochs": 0
78
- }
79
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
HiromachiNanami_v2/HiromachiNanami_v2.pth DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:e62037a3e7bc9fd852401e250e05344a88bcb9f529f20e4a0b4c9f9382003a70
3
- size 55222767
 
 
 
 
HiromachiNanami_v2/added_IVF256_Flat_nprobe_1_HiromachiNanami_v2_v2.index DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:ad8b5f631be16d6351963eb54e49e924188ccb8a373db75a04332ab2f83b05fe
3
- size 31588619
 
 
 
 
HiromachiNanami_v2/config.json DELETED
@@ -1,79 +0,0 @@
1
- {
2
- "data": {
3
- "filter_length": 2048,
4
- "hop_length": 400,
5
- "max_wav_value": 32768.0,
6
- "mel_fmax": null,
7
- "mel_fmin": 0.0,
8
- "n_mel_channels": 125,
9
- "sampling_rate": 40000,
10
- "win_length": 2048
11
- },
12
- "model": {
13
- "filter_channels": 768,
14
- "gin_channels": 256,
15
- "hidden_channels": 192,
16
- "inter_channels": 192,
17
- "kernel_size": 3,
18
- "n_heads": 2,
19
- "n_layers": 6,
20
- "p_dropout": 0,
21
- "resblock": "1",
22
- "resblock_dilation_sizes": [
23
- [
24
- 1,
25
- 3,
26
- 5
27
- ],
28
- [
29
- 1,
30
- 3,
31
- 5
32
- ],
33
- [
34
- 1,
35
- 3,
36
- 5
37
- ]
38
- ],
39
- "resblock_kernel_sizes": [
40
- 3,
41
- 7,
42
- 11
43
- ],
44
- "spk_embed_dim": 109,
45
- "upsample_initial_channel": 512,
46
- "upsample_kernel_sizes": [
47
- 16,
48
- 16,
49
- 4,
50
- 4
51
- ],
52
- "upsample_rates": [
53
- 10,
54
- 10,
55
- 2,
56
- 2
57
- ],
58
- "use_spectral_norm": false
59
- },
60
- "train": {
61
- "batch_size": 4,
62
- "betas": [
63
- 0.8,
64
- 0.99
65
- ],
66
- "c_kl": 1.0,
67
- "c_mel": 45,
68
- "epochs": 20000,
69
- "eps": 1e-09,
70
- "fp16_run": true,
71
- "init_lr_ratio": 1,
72
- "learning_rate": 0.0001,
73
- "log_interval": 200,
74
- "lr_decay": 0.999875,
75
- "seed": 1234,
76
- "segment_size": 12800,
77
- "warmup_epochs": 0
78
- }
79
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
Kanon_v2/Kanon_v2.pth DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:353f0c56b4e6a991f315f3a87487c12781d03981bc74c2084849b99806527d6a
3
- size 55222767
 
 
 
 
Kanon_v2/added_IVF256_Flat_nprobe_1_Kanon_v2_v2.index DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:5bea0c84233806a33d2f91e0a2a3fce18ea340727d2577cba90ed7ef9b0b0bde
3
- size 31588619
 
 
 
 
Kanon_v2/config.json DELETED
@@ -1,79 +0,0 @@
1
- {
2
- "data": {
3
- "filter_length": 2048,
4
- "hop_length": 400,
5
- "max_wav_value": 32768.0,
6
- "mel_fmax": null,
7
- "mel_fmin": 0.0,
8
- "n_mel_channels": 125,
9
- "sampling_rate": 40000,
10
- "win_length": 2048
11
- },
12
- "model": {
13
- "filter_channels": 768,
14
- "gin_channels": 256,
15
- "hidden_channels": 192,
16
- "inter_channels": 192,
17
- "kernel_size": 3,
18
- "n_heads": 2,
19
- "n_layers": 6,
20
- "p_dropout": 0,
21
- "resblock": "1",
22
- "resblock_dilation_sizes": [
23
- [
24
- 1,
25
- 3,
26
- 5
27
- ],
28
- [
29
- 1,
30
- 3,
31
- 5
32
- ],
33
- [
34
- 1,
35
- 3,
36
- 5
37
- ]
38
- ],
39
- "resblock_kernel_sizes": [
40
- 3,
41
- 7,
42
- 11
43
- ],
44
- "spk_embed_dim": 109,
45
- "upsample_initial_channel": 512,
46
- "upsample_kernel_sizes": [
47
- 16,
48
- 16,
49
- 4,
50
- 4
51
- ],
52
- "upsample_rates": [
53
- 10,
54
- 10,
55
- 2,
56
- 2
57
- ],
58
- "use_spectral_norm": false
59
- },
60
- "train": {
61
- "batch_size": 4,
62
- "betas": [
63
- 0.8,
64
- 0.99
65
- ],
66
- "c_kl": 1.0,
67
- "c_mel": 45,
68
- "epochs": 20000,
69
- "eps": 1e-09,
70
- "fp16_run": true,
71
- "init_lr_ratio": 1,
72
- "learning_rate": 0.0001,
73
- "log_interval": 200,
74
- "lr_decay": 0.999875,
75
- "seed": 1234,
76
- "segment_size": 12800,
77
- "warmup_epochs": 0
78
- }
79
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
Mashiro_v2/Mashiro_v2.pth DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:085684ccd0de538e790fc5dc648b16de2786342c845a428f2a83bbe3c5dfd23f
3
- size 55222767
 
 
 
 
Mashiro_v2/added_IVF256_Flat_nprobe_1_Mashiro_v2_v2.index DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:8fb21a3418587ab247cd384282e9986066376e7dccc41988b5c63324654e2ace
3
- size 31588619
 
 
 
 
Mashiro_v2/config.json DELETED
@@ -1,79 +0,0 @@
1
- {
2
- "data": {
3
- "filter_length": 2048,
4
- "hop_length": 400,
5
- "max_wav_value": 32768.0,
6
- "mel_fmax": null,
7
- "mel_fmin": 0.0,
8
- "n_mel_channels": 125,
9
- "sampling_rate": 40000,
10
- "win_length": 2048
11
- },
12
- "model": {
13
- "filter_channels": 768,
14
- "gin_channels": 256,
15
- "hidden_channels": 192,
16
- "inter_channels": 192,
17
- "kernel_size": 3,
18
- "n_heads": 2,
19
- "n_layers": 6,
20
- "p_dropout": 0,
21
- "resblock": "1",
22
- "resblock_dilation_sizes": [
23
- [
24
- 1,
25
- 3,
26
- 5
27
- ],
28
- [
29
- 1,
30
- 3,
31
- 5
32
- ],
33
- [
34
- 1,
35
- 3,
36
- 5
37
- ]
38
- ],
39
- "resblock_kernel_sizes": [
40
- 3,
41
- 7,
42
- 11
43
- ],
44
- "spk_embed_dim": 109,
45
- "upsample_initial_channel": 512,
46
- "upsample_kernel_sizes": [
47
- 16,
48
- 16,
49
- 4,
50
- 4
51
- ],
52
- "upsample_rates": [
53
- 10,
54
- 10,
55
- 2,
56
- 2
57
- ],
58
- "use_spectral_norm": false
59
- },
60
- "train": {
61
- "batch_size": 4,
62
- "betas": [
63
- 0.8,
64
- 0.99
65
- ],
66
- "c_kl": 1.0,
67
- "c_mel": 45,
68
- "epochs": 20000,
69
- "eps": 1e-09,
70
- "fp16_run": true,
71
- "init_lr_ratio": 1,
72
- "learning_rate": 0.0001,
73
- "log_interval": 200,
74
- "lr_decay": 0.999875,
75
- "seed": 1234,
76
- "segment_size": 12800,
77
- "warmup_epochs": 0
78
- }
79
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
Maya_v2/Maya_v2.pth DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:51f7922475a94e858b86eb9bd8dd41d7e10e785f808a4ac6731fe079af7fe393
3
- size 55222767
 
 
 
 
Maya_v2/added_IVF256_Flat_nprobe_1_Maya_v2_v2.index DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:f6df045277c31b75270e27fd15381eb5ba0b6aa81c7c1642c0899f3348954f08
3
- size 31588619
 
 
 
 
Maya_v2/config.json DELETED
@@ -1,79 +0,0 @@
1
- {
2
- "data": {
3
- "filter_length": 2048,
4
- "hop_length": 400,
5
- "max_wav_value": 32768.0,
6
- "mel_fmax": null,
7
- "mel_fmin": 0.0,
8
- "n_mel_channels": 125,
9
- "sampling_rate": 40000,
10
- "win_length": 2048
11
- },
12
- "model": {
13
- "filter_channels": 768,
14
- "gin_channels": 256,
15
- "hidden_channels": 192,
16
- "inter_channels": 192,
17
- "kernel_size": 3,
18
- "n_heads": 2,
19
- "n_layers": 6,
20
- "p_dropout": 0,
21
- "resblock": "1",
22
- "resblock_dilation_sizes": [
23
- [
24
- 1,
25
- 3,
26
- 5
27
- ],
28
- [
29
- 1,
30
- 3,
31
- 5
32
- ],
33
- [
34
- 1,
35
- 3,
36
- 5
37
- ]
38
- ],
39
- "resblock_kernel_sizes": [
40
- 3,
41
- 7,
42
- 11
43
- ],
44
- "spk_embed_dim": 109,
45
- "upsample_initial_channel": 512,
46
- "upsample_kernel_sizes": [
47
- 16,
48
- 16,
49
- 4,
50
- 4
51
- ],
52
- "upsample_rates": [
53
- 10,
54
- 10,
55
- 2,
56
- 2
57
- ],
58
- "use_spectral_norm": false
59
- },
60
- "train": {
61
- "batch_size": 4,
62
- "betas": [
63
- 0.8,
64
- 0.99
65
- ],
66
- "c_kl": 1.0,
67
- "c_mel": 45,
68
- "epochs": 20000,
69
- "eps": 1e-09,
70
- "fp16_run": true,
71
- "init_lr_ratio": 1,
72
- "learning_rate": 0.0001,
73
- "log_interval": 200,
74
- "lr_decay": 0.999875,
75
- "seed": 1234,
76
- "segment_size": 12800,
77
- "warmup_epochs": 0
78
- }
79
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
Rinko1_v2/Rinko1_v2.pth DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:3ed2bfcc360bf43564098ed5b85a963ceddf9cc71cd8abc91bc9d59fac9dc4ee
3
- size 55222767
 
 
 
 
Rinko1_v2/added_IVF256_Flat_nprobe_1_Rinko1_v2_v2.index DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:f837795d36f9b5d98a961a605dea8fff5ea30dcb6f71072e398272a69c27fa9d
3
- size 31588619
 
 
 
 
Rinko1_v2/config.json DELETED
@@ -1,79 +0,0 @@
1
- {
2
- "data": {
3
- "filter_length": 2048,
4
- "hop_length": 400,
5
- "max_wav_value": 32768.0,
6
- "mel_fmax": null,
7
- "mel_fmin": 0.0,
8
- "n_mel_channels": 125,
9
- "sampling_rate": 40000,
10
- "win_length": 2048
11
- },
12
- "model": {
13
- "filter_channels": 768,
14
- "gin_channels": 256,
15
- "hidden_channels": 192,
16
- "inter_channels": 192,
17
- "kernel_size": 3,
18
- "n_heads": 2,
19
- "n_layers": 6,
20
- "p_dropout": 0,
21
- "resblock": "1",
22
- "resblock_dilation_sizes": [
23
- [
24
- 1,
25
- 3,
26
- 5
27
- ],
28
- [
29
- 1,
30
- 3,
31
- 5
32
- ],
33
- [
34
- 1,
35
- 3,
36
- 5
37
- ]
38
- ],
39
- "resblock_kernel_sizes": [
40
- 3,
41
- 7,
42
- 11
43
- ],
44
- "spk_embed_dim": 109,
45
- "upsample_initial_channel": 512,
46
- "upsample_kernel_sizes": [
47
- 16,
48
- 16,
49
- 4,
50
- 4
51
- ],
52
- "upsample_rates": [
53
- 10,
54
- 10,
55
- 2,
56
- 2
57
- ],
58
- "use_spectral_norm": false
59
- },
60
- "train": {
61
- "batch_size": 4,
62
- "betas": [
63
- 0.8,
64
- 0.99
65
- ],
66
- "c_kl": 1.0,
67
- "c_mel": 45,
68
- "epochs": 20000,
69
- "eps": 1e-09,
70
- "fp16_run": true,
71
- "init_lr_ratio": 1,
72
- "learning_rate": 0.0001,
73
- "log_interval": 200,
74
- "lr_decay": 0.999875,
75
- "seed": 1234,
76
- "segment_size": 12800,
77
- "warmup_epochs": 0
78
- }
79
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
Rui_v2/Rui_v2.pth DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:865d65d30e74669d3c1cd7f08e907b4ac1edbf69212fade3b1595ff1d82e0a40
3
- size 55222767
 
 
 
 
Rui_v2/added_IVF256_Flat_nprobe_1_Rui_v2_v2.index DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:a148b8feec79918a0cc0d42b14b30f9fc65406c047b2990b4642dfd536721633
3
- size 31588619
 
 
 
 
Rui_v2/config.json DELETED
@@ -1,79 +0,0 @@
1
- {
2
- "data": {
3
- "filter_length": 2048,
4
- "hop_length": 400,
5
- "max_wav_value": 32768.0,
6
- "mel_fmax": null,
7
- "mel_fmin": 0.0,
8
- "n_mel_channels": 125,
9
- "sampling_rate": 40000,
10
- "win_length": 2048
11
- },
12
- "model": {
13
- "filter_channels": 768,
14
- "gin_channels": 256,
15
- "hidden_channels": 192,
16
- "inter_channels": 192,
17
- "kernel_size": 3,
18
- "n_heads": 2,
19
- "n_layers": 6,
20
- "p_dropout": 0,
21
- "resblock": "1",
22
- "resblock_dilation_sizes": [
23
- [
24
- 1,
25
- 3,
26
- 5
27
- ],
28
- [
29
- 1,
30
- 3,
31
- 5
32
- ],
33
- [
34
- 1,
35
- 3,
36
- 5
37
- ]
38
- ],
39
- "resblock_kernel_sizes": [
40
- 3,
41
- 7,
42
- 11
43
- ],
44
- "spk_embed_dim": 109,
45
- "upsample_initial_channel": 512,
46
- "upsample_kernel_sizes": [
47
- 16,
48
- 16,
49
- 4,
50
- 4
51
- ],
52
- "upsample_rates": [
53
- 10,
54
- 10,
55
- 2,
56
- 2
57
- ],
58
- "use_spectral_norm": false
59
- },
60
- "train": {
61
- "batch_size": 4,
62
- "betas": [
63
- 0.8,
64
- 0.99
65
- ],
66
- "c_kl": 1.0,
67
- "c_mel": 45,
68
- "epochs": 20000,
69
- "eps": 1e-09,
70
- "fp16_run": true,
71
- "init_lr_ratio": 1,
72
- "learning_rate": 0.0001,
73
- "log_interval": 200,
74
- "lr_decay": 0.999875,
75
- "seed": 1234,
76
- "segment_size": 12800,
77
- "warmup_epochs": 0
78
- }
79
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
Toko_v2/Toko_v2.pth DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:befcf40285d8dbac6085c45c24d345f4a22ff69503b8852be8984f653f3ae4c6
3
- size 55222767
 
 
 
 
Toko_v2/added_IVF256_Flat_nprobe_1_Toko_v2_v2.index DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:e6a9c3a609a3352ce7a4ceb994b5f11c35de39e71a031cca722b0f95f2d179b4
3
- size 31588619
 
 
 
 
Toko_v2/config.json DELETED
@@ -1,79 +0,0 @@
1
- {
2
- "data": {
3
- "filter_length": 2048,
4
- "hop_length": 400,
5
- "max_wav_value": 32768.0,
6
- "mel_fmax": null,
7
- "mel_fmin": 0.0,
8
- "n_mel_channels": 125,
9
- "sampling_rate": 40000,
10
- "win_length": 2048
11
- },
12
- "model": {
13
- "filter_channels": 768,
14
- "gin_channels": 256,
15
- "hidden_channels": 192,
16
- "inter_channels": 192,
17
- "kernel_size": 3,
18
- "n_heads": 2,
19
- "n_layers": 6,
20
- "p_dropout": 0,
21
- "resblock": "1",
22
- "resblock_dilation_sizes": [
23
- [
24
- 1,
25
- 3,
26
- 5
27
- ],
28
- [
29
- 1,
30
- 3,
31
- 5
32
- ],
33
- [
34
- 1,
35
- 3,
36
- 5
37
- ]
38
- ],
39
- "resblock_kernel_sizes": [
40
- 3,
41
- 7,
42
- 11
43
- ],
44
- "spk_embed_dim": 109,
45
- "upsample_initial_channel": 512,
46
- "upsample_kernel_sizes": [
47
- 16,
48
- 16,
49
- 4,
50
- 4
51
- ],
52
- "upsample_rates": [
53
- 10,
54
- 10,
55
- 2,
56
- 2
57
- ],
58
- "use_spectral_norm": false
59
- },
60
- "train": {
61
- "batch_size": 4,
62
- "betas": [
63
- 0.8,
64
- 0.99
65
- ],
66
- "c_kl": 1.0,
67
- "c_mel": 45,
68
- "epochs": 20000,
69
- "eps": 1e-09,
70
- "fp16_run": true,
71
- "init_lr_ratio": 1,
72
- "learning_rate": 0.0001,
73
- "log_interval": 200,
74
- "lr_decay": 0.999875,
75
- "seed": 1234,
76
- "segment_size": 12800,
77
- "warmup_epochs": 0
78
- }
79
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
Tsugumi_v2/Tsugumi_v2.pth DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:173aa530db9fd26665772d28c4fdf035650f03a8e5bc33fbe79066a2635ebf4a
3
- size 55222767
 
 
 
 
Tsugumi_v2/added_IVF256_Flat_nprobe_1_Tsugumi_v2_v2.index DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:e3f562972ba599541483d9ec7c7a81c67291328544a6e3945be54cea2b551fcc
3
- size 31588619
 
 
 
 
Tsugumi_v2/config.json DELETED
@@ -1,79 +0,0 @@
1
- {
2
- "data": {
3
- "filter_length": 2048,
4
- "hop_length": 400,
5
- "max_wav_value": 32768.0,
6
- "mel_fmax": null,
7
- "mel_fmin": 0.0,
8
- "n_mel_channels": 125,
9
- "sampling_rate": 40000,
10
- "win_length": 2048
11
- },
12
- "model": {
13
- "filter_channels": 768,
14
- "gin_channels": 256,
15
- "hidden_channels": 192,
16
- "inter_channels": 192,
17
- "kernel_size": 3,
18
- "n_heads": 2,
19
- "n_layers": 6,
20
- "p_dropout": 0,
21
- "resblock": "1",
22
- "resblock_dilation_sizes": [
23
- [
24
- 1,
25
- 3,
26
- 5
27
- ],
28
- [
29
- 1,
30
- 3,
31
- 5
32
- ],
33
- [
34
- 1,
35
- 3,
36
- 5
37
- ]
38
- ],
39
- "resblock_kernel_sizes": [
40
- 3,
41
- 7,
42
- 11
43
- ],
44
- "spk_embed_dim": 109,
45
- "upsample_initial_channel": 512,
46
- "upsample_kernel_sizes": [
47
- 16,
48
- 16,
49
- 4,
50
- 4
51
- ],
52
- "upsample_rates": [
53
- 10,
54
- 10,
55
- 2,
56
- 2
57
- ],
58
- "use_spectral_norm": false
59
- },
60
- "train": {
61
- "batch_size": 4,
62
- "betas": [
63
- 0.8,
64
- 0.99
65
- ],
66
- "c_kl": 1.0,
67
- "c_mel": 45,
68
- "epochs": 20000,
69
- "eps": 1e-09,
70
- "fp16_run": true,
71
- "init_lr_ratio": 1,
72
- "learning_rate": 0.0001,
73
- "log_interval": 200,
74
- "lr_decay": 0.999875,
75
- "seed": 1234,
76
- "segment_size": 12800,
77
- "warmup_epochs": 0
78
- }
79
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
Tsukushi_v2/Tsukushi_v2.pth DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:a88c0c70c086237727e474a1457df03984852751324ed89a851ef4fea989818c
3
- size 55222767
 
 
 
 
Tsukushi_v2/added_IVF256_Flat_nprobe_1_Tsukushi_v2_v2.index DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:3cc38460dbfeca1b437c9915655e3b0b3f8e12b2911843e17a59ff0a986226ca
3
- size 31588619
 
 
 
 
Tsukushi_v2/config.json DELETED
@@ -1,79 +0,0 @@
1
- {
2
- "data": {
3
- "filter_length": 2048,
4
- "hop_length": 400,
5
- "max_wav_value": 32768.0,
6
- "mel_fmax": null,
7
- "mel_fmin": 0.0,
8
- "n_mel_channels": 125,
9
- "sampling_rate": 40000,
10
- "win_length": 2048
11
- },
12
- "model": {
13
- "filter_channels": 768,
14
- "gin_channels": 256,
15
- "hidden_channels": 192,
16
- "inter_channels": 192,
17
- "kernel_size": 3,
18
- "n_heads": 2,
19
- "n_layers": 6,
20
- "p_dropout": 0,
21
- "resblock": "1",
22
- "resblock_dilation_sizes": [
23
- [
24
- 1,
25
- 3,
26
- 5
27
- ],
28
- [
29
- 1,
30
- 3,
31
- 5
32
- ],
33
- [
34
- 1,
35
- 3,
36
- 5
37
- ]
38
- ],
39
- "resblock_kernel_sizes": [
40
- 3,
41
- 7,
42
- 11
43
- ],
44
- "spk_embed_dim": 109,
45
- "upsample_initial_channel": 512,
46
- "upsample_kernel_sizes": [
47
- 16,
48
- 16,
49
- 4,
50
- 4
51
- ],
52
- "upsample_rates": [
53
- 10,
54
- 10,
55
- 2,
56
- 2
57
- ],
58
- "use_spectral_norm": false
59
- },
60
- "train": {
61
- "batch_size": 4,
62
- "betas": [
63
- 0.8,
64
- 0.99
65
- ],
66
- "c_kl": 1.0,
67
- "c_mel": 45,
68
- "epochs": 20000,
69
- "eps": 1e-09,
70
- "fp16_run": true,
71
- "init_lr_ratio": 1,
72
- "learning_rate": 0.0001,
73
- "log_interval": 200,
74
- "lr_decay": 0.999875,
75
- "seed": 1234,
76
- "segment_size": 12800,
77
- "warmup_epochs": 0
78
- }
79
- }