Vaibhav Adlakha committed on
Commit
ae2f666
1 Parent(s): c05fcec

adding metadata for llm2vec models

Browse files
Files changed (1) hide show
  1. app.py +30 -0
app.py CHANGED
@@ -341,6 +341,12 @@ EXTERNAL_MODELS = [
341
  "DanskBERT",
342
  "LASER2",
343
  "LaBSE",
 
 
 
 
 
 
344
  "OpenSearch-text-hybrid",
345
  "all-MiniLM-L12-v2",
346
  "all-MiniLM-L6-v2",
@@ -453,6 +459,12 @@ EXTERNAL_MODEL_TO_LINK = {
453
  "Cohere-embed-english-v3.0": "https://huggingface.co/Cohere/Cohere-embed-english-v3.0",
454
  "Cohere-embed-multilingual-v3.0": "https://huggingface.co/Cohere/Cohere-embed-multilingual-v3.0",
455
  "Cohere-embed-multilingual-light-v3.0": "https://huggingface.co/Cohere/Cohere-embed-multilingual-light-v3.0",
 
 
 
 
 
 
456
  "allenai-specter": "https://huggingface.co/sentence-transformers/allenai-specter",
457
  "allenai-specter": "https://huggingface.co/sentence-transformers/allenai-specter",
458
  "all-MiniLM-L12-v2": "https://huggingface.co/sentence-transformers/all-MiniLM-L12-v2",
@@ -577,6 +589,12 @@ EXTERNAL_MODEL_TO_DIM = {
577
  "Cohere-embed-english-v3.0": 1024,
578
  "Cohere-embed-multilingual-v3.0": 1024,
579
  "Cohere-embed-multilingual-light-v3.0": 384,
 
 
 
 
 
 
580
  "all-MiniLM-L12-v2": 384,
581
  "all-MiniLM-L6-v2": 384,
582
  "all-mpnet-base-v2": 768,
@@ -700,6 +718,12 @@ EXTERNAL_MODEL_TO_SEQLEN = {
700
  "Cohere-embed-english-v3.0": 512,
701
  "Cohere-embed-multilingual-v3.0": 512,
702
  "Cohere-embed-multilingual-light-v3.0": 512,
 
 
 
 
 
 
703
  "all-MiniLM-L12-v2": 512,
704
  "all-MiniLM-L6-v2": 512,
705
  "all-mpnet-base-v2": 514,
@@ -820,6 +844,12 @@ EXTERNAL_MODEL_TO_SEQLEN = {
820
  }
821
 
822
  EXTERNAL_MODEL_TO_SIZE = {
 
 
 
 
 
 
823
  "allenai-specter": 110,
824
  "all-MiniLM-L12-v2": 33,
825
  "all-MiniLM-L6-v2": 23,
 
341
  "DanskBERT",
342
  "LASER2",
343
  "LaBSE",
344
+ "LLM2Vec-Llama-supervised",
345
+ "LLM2Vec-Llama-unsupervised",
346
+ "LLM2Vec-Mistral-supervised",
347
+ "LLM2Vec-Mistral-unsupervised",
348
+ "LLM2Vec-Sheared-Llama-supervised",
349
+ "LLM2Vec-Sheared-Llama-unsupervised",
350
  "OpenSearch-text-hybrid",
351
  "all-MiniLM-L12-v2",
352
  "all-MiniLM-L6-v2",
 
459
  "Cohere-embed-english-v3.0": "https://huggingface.co/Cohere/Cohere-embed-english-v3.0",
460
  "Cohere-embed-multilingual-v3.0": "https://huggingface.co/Cohere/Cohere-embed-multilingual-v3.0",
461
  "Cohere-embed-multilingual-light-v3.0": "https://huggingface.co/Cohere/Cohere-embed-multilingual-light-v3.0",
462
+ "LLM2Vec-Llama-supervised": "https://huggingface.co/McGill-NLP/LLM2Vec-Llama-2-7b-chat-hf-mntp-supervised",
463
+ "LLM2Vec-Llama-unsupervised": "https://huggingface.co/McGill-NLP/LLM2Vec-Llama-2-7b-chat-hf-mntp",
464
+ "LLM2Vec-Mistral-supervised": "https://huggingface.co/McGill-NLP/LLM2Vec-Mistral-7B-Instruct-v2-mntp-supervised",
465
+ "LLM2Vec-Mistral-unsupervised": "https://huggingface.co/McGill-NLP/LLM2Vec-Mistral-7B-Instruct-v2-mntp",
466
+ "LLM2Vec-Sheared-Llama-supervised": "https://huggingface.co/McGill-NLP/LLM2Vec-Sheared-LLaMA-mntp-supervised",
467
+ "LLM2Vec-Sheared-Llama-unsupervised": "https://huggingface.co/McGill-NLP/LLM2Vec-Sheared-LLaMA-mntp",
468
  "allenai-specter": "https://huggingface.co/sentence-transformers/allenai-specter",
469
  "allenai-specter": "https://huggingface.co/sentence-transformers/allenai-specter",
470
  "all-MiniLM-L12-v2": "https://huggingface.co/sentence-transformers/all-MiniLM-L12-v2",
 
589
  "Cohere-embed-english-v3.0": 1024,
590
  "Cohere-embed-multilingual-v3.0": 1024,
591
  "Cohere-embed-multilingual-light-v3.0": 384,
592
+ "LLM2Vec-Llama-supervised": 4096,
593
+ "LLM2Vec-Llama-unsupervised": 4096,
594
+ "LLM2Vec-Mistral-supervised": 4096,
595
+ "LLM2Vec-Mistral-unsupervised": 4096,
596
+ "LLM2Vec-Sheared-Llama-supervised": 2048,
597
+ "LLM2Vec-Sheared-Llama-unsupervised": 2048,
598
  "all-MiniLM-L12-v2": 384,
599
  "all-MiniLM-L6-v2": 384,
600
  "all-mpnet-base-v2": 768,
 
718
  "Cohere-embed-english-v3.0": 512,
719
  "Cohere-embed-multilingual-v3.0": 512,
720
  "Cohere-embed-multilingual-light-v3.0": 512,
721
+ "LLM2Vec-Llama-supervised": 512,
722
+ "LLM2Vec-Llama-unsupervised": 512,
723
+ "LLM2Vec-Mistral-supervised": 512,
724
+ "LLM2Vec-Mistral-unsupervised": 512,
725
+ "LLM2Vec-Sheared-Llama-supervised": 512,
726
+ "LLM2Vec-Sheared-Llama-unsupervised": 512,
727
  "all-MiniLM-L12-v2": 512,
728
  "all-MiniLM-L6-v2": 512,
729
  "all-mpnet-base-v2": 514,
 
844
  }
845
 
846
  EXTERNAL_MODEL_TO_SIZE = {
847
+ "LLM2Vec-Llama-supervised": 6607,
848
+ "LLM2Vec-Llama-unsupervised": 6607,
849
+ "LLM2Vec-Mistral-supervised": 7111,
850
+ "LLM2Vec-Mistral-unsupervised": 7111,
851
+ "LLM2Vec-Sheared-Llama-supervised": 1280,
852
+ "LLM2Vec-Sheared-Llama-unsupervised": 1280,
853
  "allenai-specter": 110,
854
  "all-MiniLM-L12-v2": 33,
855
  "all-MiniLM-L6-v2": 23,