ryota-komatsu committed on
Commit
0b9f0b9
1 Parent(s): c292c96

Upload 22 files

Browse files
.gitattributes CHANGED
@@ -33,3 +33,9 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ models/byol_tgt_layer_6/checkpoint filter=lfs diff=lfs merge=lfs -text
37
+ models/byol/checkpoint filter=lfs diff=lfs merge=lfs -text
38
+ models/byol/checkpoint_sid filter=lfs diff=lfs merge=lfs -text
39
+ models/dino/checkpoint filter=lfs diff=lfs merge=lfs -text
40
+ models/hubert/checkpoint_sid filter=lfs diff=lfs merge=lfs -text
41
+ models/vg-hubert_3/checkpoint_sid filter=lfs diff=lfs merge=lfs -text
README.md ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ license: mit
3
+ datasets:
4
+ - openslr/librispeech_asr
5
+ language:
6
+ - en
7
+ ---
8
+
9
+ # Self-Supervised Syllable Discovery Based on Speaker-Disentangled HuBERT
10
+
11
+ This is the official model repository for the [speaker_disentangled_hubert](https://github.com/ryota-komatsu/speaker_disentangled_hubert) GitHub project.
models/byol/checkpoint ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5a615c08753d835e1b45960c2c8d5723bd1e9186a9749bd3e637aa6f5d2f0ced
3
+ size 1444845288
models/byol/checkpoint_sid ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:46e3da2370c3fd40f30ad0cd7977e197aeacc4f9d483aacbc3895ba242b9a47d
3
+ size 383784814
models/byol/quantizer1.joblib ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7c329cacd4f3f84387e6a16b623935082e330f3e45e0068fc79029935af4ae1d
3
+ size 50398058
models/byol/quantizer2.npy ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c77213ed62a78b046e0267baad2f575b68fa6a979dfced83ab83537965f56a33
3
+ size 131200
models/byol_tgt_layer_6/checkpoint ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:113dbcb3b7bf5605465c9c5523b7123fef13561f9ec73ac1421d3b01e7d7b069
3
+ size 1457428200
models/byol_tgt_layer_6/quantizer1.joblib ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d2536bade704d94ce9d761330c6201fc78483e1c58f89ed8d0d547d458e279c8
3
+ size 50398058
models/byol_tgt_layer_6/quantizer2.npy ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f6ebc267396f21ba9a60c2f8abce3044988edd4c3ecfca7ae654f4a119967634
3
+ size 131200
models/dino/checkpoint ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0d074285e61d15e8eb49ffa81be7061eb04568896d1dfb11c91c907ee603d49e
3
+ size 1516041480
models/dino/quantizer1.joblib ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eb4199b374ea13b20a145d5d4123a728f6933c0fa1accabdedaa8f492628726a
3
+ size 50398058
models/dino/quantizer2.npy ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d0e7347fd57e478a9e228e546f150cd3f2591999ac408d74087218f632354cc3
3
+ size 131200
models/hubert/checkpoint_sid ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2562f5d5c0c8aee8559f3bf1f64c55b8564242ebde01801293897d58b62fcd8b
3
+ size 383784814
models/hubert/quantizer1.joblib ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:730d7408a8f48d91185eadee509a39ad93bfc9b799b524c4890a4371e8b0e5f8
3
+ size 50398058
models/hubert/quantizer2.npy ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:62db8041c381d3e26caeb429d53edfa59f7c385a7d097b0532a7b19b445aa810
3
+ size 131200
models/vg-hubert_3/checkpoint_sid ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f8be075bab4362d94f8cc14d4603532a126174885fa6aca14ba59da17cdb460b
3
+ size 383781359
models/vg-hubert_3/quantizer1.joblib ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e30a79b1273298b09b3d08671bb635270b15532d7601eba61bd695142e0ce853
3
+ size 50398058
models/vg-hubert_3/quantizer2.npy ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6cfbb8dda51794e2630d3d26d3fc91a577c84335933401b0c0c66107c608cf58
3
+ size 131200
results/byol.json ADDED
@@ -0,0 +1,20 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "segmentation": {
3
+ "match_gt": 110641,
4
+ "match_pred": 110641,
5
+ "gt_len": 163763,
6
+ "pred_len": 150931,
7
+ "prec": 0.7330568272919413,
8
+ "recall": 0.6756165922705373,
9
+ "f1": 0.7031656148512523,
10
+ "os": -0.07835713805926858,
11
+ "r1": 0.3337131047696781,
12
+ "r2": -0.1739668436338245,
13
+ "r_val": 0.7461600257982487
14
+ },
15
+ "clustering": {
16
+ "syllable_purity": 0.5935364727608494,
17
+ "cluster_purity": 0.4447403934938561,
18
+ "mutual_info": 5.07649445946761
19
+ }
20
+ }
results/byol_tgt_layer_6.json ADDED
@@ -0,0 +1,20 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "segmentation": {
3
+ "match_gt": 37215,
4
+ "match_pred": 37215,
5
+ "gt_len": 163763,
6
+ "pred_len": 81606,
7
+ "prec": 0.456032644658481,
8
+ "recall": 0.22724913441986286,
9
+ "f1": 0.303339052610558,
10
+ "os": -0.5016823091907208,
11
+ "r1": 0.9213191844359832,
12
+ "r2": -0.19167441438940436,
13
+ "r_val": 0.4435032005873063
14
+ },
15
+ "clustering": {
16
+ "syllable_purity": 0.10408265804357068,
17
+ "cluster_purity": 0.1427706419654475,
18
+ "mutual_info": 2.166068535065666
19
+ }
20
+ }
results/dino.json ADDED
@@ -0,0 +1,20 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "segmentation": {
3
+ "match_gt": 106629,
4
+ "match_pred": 106629,
5
+ "gt_len": 163763,
6
+ "pred_len": 165706,
7
+ "prec": 0.6434830362207765,
8
+ "recall": 0.6511177738561214,
9
+ "f1": 0.6472778926090162,
10
+ "os": 0.011864706924030521,
11
+ "r1": 0.34908391396554156,
12
+ "r2": -0.2550866026645681,
13
+ "r_val": 0.6979147416849452
14
+ },
15
+ "clustering": {
16
+ "syllable_purity": 0.590599474096453,
17
+ "cluster_purity": 0.42873727201521766,
18
+ "mutual_info": 5.060749923481224
19
+ }
20
+ }
results/hubert.json ADDED
@@ -0,0 +1,20 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "segmentation": {
3
+ "match_gt": 51481,
4
+ "match_pred": 51481,
5
+ "gt_len": 163763,
6
+ "pred_len": 100135,
7
+ "prec": 0.514115943476307,
8
+ "recall": 0.3143628292105054,
9
+ "f1": 0.39015831874436335,
10
+ "os": -0.38853709323839936,
11
+ "r1": 0.7880732217188751,
12
+ "r2": -0.2100814795274286,
13
+ "r_val": 0.5009226493768482
14
+ },
15
+ "clustering": {
16
+ "syllable_purity": 0.33106618025927986,
17
+ "cluster_purity": 0.28381664914775656,
18
+ "mutual_info": 3.5403592325037194
19
+ }
20
+ }
results/vg-hubert_3.json ADDED
@@ -0,0 +1,20 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "segmentation": {
3
+ "match_gt": 105266,
4
+ "match_pred": 105266,
5
+ "gt_len": 163763,
6
+ "pred_len": 161292,
7
+ "prec": 0.6526424125189098,
8
+ "recall": 0.6427947704915029,
9
+ "f1": 0.6476811616495669,
10
+ "os": -0.015088878440184916,
11
+ "r1": 0.357523775769949,
12
+ "r2": -0.2419127917952011,
13
+ "r_val": 0.700281716217425
14
+ },
15
+ "clustering": {
16
+ "syllable_purity": 0.534248207514771,
17
+ "cluster_purity": 0.4357403682391943,
18
+ "mutual_info": 4.6595905283191055
19
+ }
20
+ }