meg-huggingface commited on
Commit
b28e93b
2 Parent(s): e530aff adb962b

Merge branch 'main' of https://huggingface.co/spaces/huggingface/data-measurements-tool-2 into main

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. cache_dir/bak/general_stats.json +3 -0
  2. cache_dir/c4_en.noblocklist_train_text/dset_peek.json +3 -0
  3. cache_dir/c4_en.noblocklist_train_text/dup_counts_df.feather +3 -0
  4. cache_dir/c4_en.noblocklist_train_text/fig_tok_length.json +3 -0
  5. cache_dir/c4_en.noblocklist_train_text/general_stats_dict.json +3 -0
  6. cache_dir/c4_en.noblocklist_train_text/length_df.feather +3 -0
  7. cache_dir/c4_en.noblocklist_train_text/length_stats.json +3 -0
  8. cache_dir/c4_en.noblocklist_train_text/npmi_terms.json +3 -0
  9. cache_dir/c4_en.noblocklist_train_text/pmi_files/gay-lesbian_npmi.csv +3 -0
  10. cache_dir/c4_en.noblocklist_train_text/pmi_files/gay-man_npmi.csv +3 -0
  11. cache_dir/c4_en.noblocklist_train_text/pmi_files/gay_npmi.csv +3 -0
  12. cache_dir/c4_en.noblocklist_train_text/pmi_files/gay_pmi.csv +3 -0
  13. cache_dir/c4_en.noblocklist_train_text/pmi_files/gay_vocab_cooc.csv +3 -0
  14. cache_dir/c4_en.noblocklist_train_text/pmi_files/lesbian_npmi.csv +3 -0
  15. cache_dir/c4_en.noblocklist_train_text/pmi_files/lesbian_pmi.csv +3 -0
  16. cache_dir/c4_en.noblocklist_train_text/pmi_files/lesbian_vocab_cooc.csv +3 -0
  17. cache_dir/c4_en.noblocklist_train_text/pmi_files/man-woman_npmi.csv +3 -0
  18. cache_dir/c4_en.noblocklist_train_text/pmi_files/man_npmi.csv +3 -0
  19. cache_dir/c4_en.noblocklist_train_text/pmi_files/man_pmi.csv +3 -0
  20. cache_dir/c4_en.noblocklist_train_text/pmi_files/man_vocab_cooc.csv +3 -0
  21. cache_dir/c4_en.noblocklist_train_text/pmi_files/woman_npmi.csv +3 -0
  22. cache_dir/c4_en.noblocklist_train_text/pmi_files/woman_pmi.csv +3 -0
  23. cache_dir/c4_en.noblocklist_train_text/pmi_files/woman_vocab_cooc.csv +3 -0
  24. cache_dir/c4_en.noblocklist_train_text/sorted_top_vocab.feather +3 -0
  25. cache_dir/c4_en.noblocklist_train_text/text_dset/dataset.arrow +3 -0
  26. cache_dir/c4_en.noblocklist_train_text/text_dset/dataset_info.json +3 -0
  27. cache_dir/c4_en.noblocklist_train_text/text_dset/state.json +3 -0
  28. cache_dir/c4_en.noblocklist_train_text/vocab_counts.feather +3 -0
  29. cache_dir/glue_cola_train_sentence/dset_peek.json +3 -0
  30. cache_dir/glue_cola_validation_sentence/dset_peek.json +3 -0
  31. cache_dir/glue_mnli_matched_validation_hypothesis/dset_peek.json +3 -0
  32. cache_dir/glue_mnli_matched_validation_premise/dset_peek.json +3 -0
  33. cache_dir/glue_mnli_mismatched_validation_hypothesis/dset_peek.json +3 -0
  34. cache_dir/glue_mnli_mismatched_validation_premise/dset_peek.json +3 -0
  35. cache_dir/glue_mnli_train_hypothesis/dset_peek.json +3 -0
  36. cache_dir/glue_mnli_train_premise/dset_peek.json +3 -0
  37. cache_dir/glue_mnli_validation_matched_hypothesis/dset_peek.json +3 -0
  38. cache_dir/glue_mnli_validation_matched_premise/dset_peek.json +3 -0
  39. cache_dir/glue_mnli_validation_mismatched_hypothesis/dset_peek.json +3 -0
  40. cache_dir/glue_mnli_validation_mismatched_premise/dset_peek.json +3 -0
  41. cache_dir/glue_mrpc_train_sentence1/dset_peek.json +3 -0
  42. cache_dir/glue_mrpc_train_sentence2/dset_peek.json +3 -0
  43. cache_dir/glue_mrpc_validation_sentence1/dset_peek.json +3 -0
  44. cache_dir/glue_mrpc_validation_sentence2/dset_peek.json +3 -0
  45. cache_dir/glue_qnli_train_question/dset_peek.json +3 -0
  46. cache_dir/glue_qnli_train_sentence/dset_peek.json +3 -0
  47. cache_dir/glue_qnli_validation_question/dset_peek.json +3 -0
  48. cache_dir/glue_qnli_validation_sentence/dset_peek.json +3 -0
  49. cache_dir/glue_qqp_train_question1/dset_peek.json +3 -0
  50. cache_dir/glue_qqp_train_question2/dset_peek.json +3 -0
cache_dir/bak/general_stats.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:12d04e38e33a11933b5689d4e2afc9a3742633b9a1ae0e607abd37c6dc3635fb
3
+ size 39
cache_dir/c4_en.noblocklist_train_text/dset_peek.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b73791ca5a24b71cb9c947f2ba19ce44459c6bd1cbef494bac8abb52ef25ea7c
3
+ size 259923
cache_dir/c4_en.noblocklist_train_text/dup_counts_df.feather ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2f9af4398cd1f9b8c9c8675a18d63cbb320b4c47fc3de49d224334627010bd7a
3
+ size 1186
cache_dir/c4_en.noblocklist_train_text/fig_tok_length.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:37ed8d608292aa5e69262330128c981eafaac42debbb616cef0403cf6048afb4
3
+ size 1536266
cache_dir/c4_en.noblocklist_train_text/general_stats_dict.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:69dc02aff74877535f762d3b94d9a9e3d21f44bf081b7797f367351ae1c3c614
3
+ size 90
cache_dir/c4_en.noblocklist_train_text/length_df.feather ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:204bbaed8b3b94dacad4bdb8c2872d402974079fb243b4ee20497118ab9317f0
3
+ size 314450450
cache_dir/c4_en.noblocklist_train_text/length_stats.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d7e4b8a8c42856f08f45036e48cda529520a0424e7e60de21b2baf328eb59784
3
+ size 63
cache_dir/c4_en.noblocklist_train_text/npmi_terms.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:40fe28d565cdaf341298dba8af66ddd48428cb15ff58f5a838277139c4a865b3
3
+ size 191
cache_dir/c4_en.noblocklist_train_text/pmi_files/gay-lesbian_npmi.csv ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:01a4cd5032c59bfcc4a0c572252e67e6d7801a2fb8cd13adbc5b450b624c19e8
3
+ size 3004532
cache_dir/c4_en.noblocklist_train_text/pmi_files/gay-man_npmi.csv ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d1c70a5bf630958a22f526e6e90d8ec0cbb039a436f6d915bac04dfc4bccfdd9
3
+ size 5631101
cache_dir/c4_en.noblocklist_train_text/pmi_files/gay_npmi.csv ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2c0b0eb158578cb1ae97f7e9a5007a4cde33a139f8d36add2619fe4a9756d4ca
3
+ size 2403437
cache_dir/c4_en.noblocklist_train_text/pmi_files/gay_pmi.csv ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:933c98af333b3afa5293e54d0b16b3dcefd88d9e0c5237f8a1a61bf857a5c9ed
3
+ size 2319355
cache_dir/c4_en.noblocklist_train_text/pmi_files/gay_vocab_cooc.csv ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1e000ee8ec5920b4a60d7f9128b7704c24b3f10bd61d235f498b1cfa91e8d6c3
3
+ size 8689948
cache_dir/c4_en.noblocklist_train_text/pmi_files/lesbian_npmi.csv ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e021274c447e576477f48567b71349c78a41055b5c37f050b63c4e1695b8ebe6
3
+ size 1473301
cache_dir/c4_en.noblocklist_train_text/pmi_files/lesbian_pmi.csv ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:85d19fc45ce8ad18764330d7fa03c7d130bd14f82375bd3f0b5b64a9c181a024
3
+ size 1403773
cache_dir/c4_en.noblocklist_train_text/pmi_files/lesbian_vocab_cooc.csv ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:39035f60bc993e8c5486cbc1f2583c21cdff9125792f051d67ebaed5e426b601
3
+ size 8683596
cache_dir/c4_en.noblocklist_train_text/pmi_files/man-woman_npmi.csv ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9e5b4be41e3bf27caa1dc3dc1d32f5a1ddd07d0b3a2dcccf55184bfd43878a41
3
+ size 10214552
cache_dir/c4_en.noblocklist_train_text/pmi_files/man_npmi.csv ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:75ff803bcf3725431f64373cb1d13ac06c89c81722d6a69fab9cc3e3def3c6c1
3
+ size 7246942
cache_dir/c4_en.noblocklist_train_text/pmi_files/man_pmi.csv ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7954bd84651437369ecda7efd7a4c6cfaac295dbc00f774ae5d612ee49a07e05
3
+ size 6995264
cache_dir/c4_en.noblocklist_train_text/pmi_files/man_vocab_cooc.csv ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:317087c0b6d54213e3e1a2ff945762548c3fd9b00a7fd88851cc1da054e25543
3
+ size 8722467
cache_dir/c4_en.noblocklist_train_text/pmi_files/woman_npmi.csv ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f1c030423138bfce91bdc90522c3ed864e1f3cc82b891982d413a9a3540f324c
3
+ size 4684288
cache_dir/c4_en.noblocklist_train_text/pmi_files/woman_pmi.csv ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:562339994ad9c79787dab69c19d1639a3e8955181d1f76944278fbca283a5827
3
+ size 4370814
cache_dir/c4_en.noblocklist_train_text/pmi_files/woman_vocab_cooc.csv ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b913c7cd4acfc1808d0b2bd37c7772c7148ded2feb89b2808b2eb892579dd5cf
3
+ size 8708146
cache_dir/c4_en.noblocklist_train_text/sorted_top_vocab.feather ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:84050c5750071dbc056c19e7ffff4424f49f75deda43fada493d204142fccfe9
3
+ size 4162
cache_dir/c4_en.noblocklist_train_text/text_dset/dataset.arrow ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5361ec9eb9b50421ed8615e5c085e581250279acbb63e14a708b3fac8a5a7da7
3
+ size 504343120
cache_dir/c4_en.noblocklist_train_text/text_dset/dataset_info.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ff8ef8d4b1ed96d6c5578f2411ee4be6c39527df741212a35d343886131c5eff
3
+ size 932
cache_dir/c4_en.noblocklist_train_text/text_dset/state.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e74c523af8156f53de88477f782d517d4f1056ff84192000ffeeea13ea01331b
3
+ size 256
cache_dir/c4_en.noblocklist_train_text/vocab_counts.feather ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e813b0dd94883d8f6e5269ca19f5ab7fcbb99ee3ad88ce77c24d60d3f5904739
3
+ size 8525314
cache_dir/glue_cola_train_sentence/dset_peek.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:222977f6ab3c38fd76c2b191d32c5d254366b963c963eeae8ff0f9b6cf2b8b5a
3
+ size 4684
cache_dir/glue_cola_validation_sentence/dset_peek.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:39a1bcf6af6461a3e71fb81dbc5f3078a622044fd4b327176a836099d09426a2
3
+ size 5939
cache_dir/glue_mnli_matched_validation_hypothesis/dset_peek.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8fd6015fbb5b45168d324a128d9a66bdb1aedc5e8a24a1f47f692758aa0a1d7c
3
+ size 18743
cache_dir/glue_mnli_matched_validation_premise/dset_peek.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8fd6015fbb5b45168d324a128d9a66bdb1aedc5e8a24a1f47f692758aa0a1d7c
3
+ size 18743
cache_dir/glue_mnli_mismatched_validation_hypothesis/dset_peek.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:974161ba9d6598954f683adbf51ab50b7684dd53556311d5f491f1b166ebb805
3
+ size 19774
cache_dir/glue_mnli_mismatched_validation_premise/dset_peek.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:974161ba9d6598954f683adbf51ab50b7684dd53556311d5f491f1b166ebb805
3
+ size 19774
cache_dir/glue_mnli_train_hypothesis/dset_peek.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b89d0b39d7d1cf07b62eb6f355e74f4cb98cacd2fc6cfa7c0cf0599b2f5151f8
3
+ size 19503
cache_dir/glue_mnli_train_premise/dset_peek.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b89d0b39d7d1cf07b62eb6f355e74f4cb98cacd2fc6cfa7c0cf0599b2f5151f8
3
+ size 19503
cache_dir/glue_mnli_validation_matched_hypothesis/dset_peek.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8fd6015fbb5b45168d324a128d9a66bdb1aedc5e8a24a1f47f692758aa0a1d7c
3
+ size 18743
cache_dir/glue_mnli_validation_matched_premise/dset_peek.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8fd6015fbb5b45168d324a128d9a66bdb1aedc5e8a24a1f47f692758aa0a1d7c
3
+ size 18743
cache_dir/glue_mnli_validation_mismatched_hypothesis/dset_peek.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:974161ba9d6598954f683adbf51ab50b7684dd53556311d5f491f1b166ebb805
3
+ size 19774
cache_dir/glue_mnli_validation_mismatched_premise/dset_peek.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:974161ba9d6598954f683adbf51ab50b7684dd53556311d5f491f1b166ebb805
3
+ size 19774
cache_dir/glue_mrpc_train_sentence1/dset_peek.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8bc1c7fd9daf223d2e5d55e89bc8f1de82435115fd3a72f1ac66393cfc1a5e08
3
+ size 24645
cache_dir/glue_mrpc_train_sentence2/dset_peek.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8bc1c7fd9daf223d2e5d55e89bc8f1de82435115fd3a72f1ac66393cfc1a5e08
3
+ size 24645
cache_dir/glue_mrpc_validation_sentence1/dset_peek.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cccc3f1ed71a6d7815d59d0823f7a89f3a2e02fc956cceef6b3beeabd3cda0d1
3
+ size 25471
cache_dir/glue_mrpc_validation_sentence2/dset_peek.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cccc3f1ed71a6d7815d59d0823f7a89f3a2e02fc956cceef6b3beeabd3cda0d1
3
+ size 25471
cache_dir/glue_qnli_train_question/dset_peek.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5d04156d796676c879c7a92016422bba27619cff0df37ff3ac0f98b21a6f3223
3
+ size 24469
cache_dir/glue_qnli_train_sentence/dset_peek.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5d04156d796676c879c7a92016422bba27619cff0df37ff3ac0f98b21a6f3223
3
+ size 24469
cache_dir/glue_qnli_validation_question/dset_peek.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e5db1c6538c353da266b50bfd84907f98c8890da1624ad6d66b37f4ba66a2dad
3
+ size 25142
cache_dir/glue_qnli_validation_sentence/dset_peek.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e5db1c6538c353da266b50bfd84907f98c8890da1624ad6d66b37f4ba66a2dad
3
+ size 25142
cache_dir/glue_qqp_train_question1/dset_peek.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:81357acfa3a1d2a51ec507e88c2d711e2e483757f0d76c1a33088dc88e6bea42
3
+ size 13229
cache_dir/glue_qqp_train_question2/dset_peek.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:81357acfa3a1d2a51ec507e88c2d711e2e483757f0d76c1a33088dc88e6bea42
3
+ size 13229