diff --git a/README.md b/README.md index d2826c1..8ab2c7b 100644 --- a/README.md +++ b/README.md @@ -109,17 +109,17 @@ tensor([[0.5485, 0.0551], # Model List - ## Mistral-7B - - ### [Bi + MNTP]() - - ### [Bi + MNTP + SimCSE]() (Unsupervised state-of-the-art on MTEB) + - ### [Bi + MNTP](https://huggingface.co/McGill-NLP/LLM2Vec-Mistral-7B-Instruct-v2-mntp) + - ### [Bi + MNTP + SimCSE](https://huggingface.co/McGill-NLP/LLM2Vec-Mistral-7B-Instruct-v2-unsup-simcse) (Unsupervised state-of-the-art on MTEB) - ### [Bi + MNTP + Supervised](https://huggingface.co/McGill-NLP/LLM2Vec-Mistral-7B-Instruct-v2-mntp-supervised) (state-of-the-art on MTEB among models trained on public data) - ## Llama-2-7B - - ### [Bi + MNTP]() - - ### [Bi + MNTP + SimCSE]() - - ### [Bi + MNTP + Supervised]() + - ### [Bi + MNTP](https://huggingface.co/McGill-NLP/LLM2Vec-Llama-2-7b-chat-hf-mntp) + - ### [Bi + MNTP + SimCSE](https://huggingface.co/McGill-NLP/LLM2Vec-Llama-2-7b-chat-hf-unsup-simcse) + - ### [Bi + MNTP + Supervised](https://huggingface.co/McGill-NLP/LLM2Vec-Llama-2-7b-chat-hf-mntp-supervised) - ## Sheared-Llama-1.3B - - ### [Bi + MNTP]() - - ### [Bi + MNTP + SimCSE]() - - ### [Bi + MNTP + Supervised]() + - ### [Bi + MNTP](https://huggingface.co/McGill-NLP/LLM2Vec-Sheared-LLaMA-mntp) + - ### [Bi + MNTP + SimCSE](https://huggingface.co/McGill-NLP/LLM2Vec-Sheared-LLaMA-unsup-simcse) + - ### [Bi + MNTP + Supervised](https://huggingface.co/McGill-NLP/LLM2Vec-Sheared-LLaMA-mntp-supervised) # Training Training code will be available soon.