Sentence Similarity
sentence-transformers
Safetensors
bert
feature-extraction
Generated from Trainer
dataset_size:244856
loss:CosineSimilarityLoss
Eval Results (legacy)
text-embeddings-inference
Instructions to use yahyaabd/allstats-semantic-search-mini-model-v2 with libraries, inference providers, notebooks, and local apps. Follow these links to get started.
- Libraries
- sentence-transformers
How to use yahyaabd/allstats-semantic-search-mini-model-v2 with sentence-transformers:
```python
from sentence_transformers import SentenceTransformer

model = SentenceTransformer("yahyaabd/allstats-semantic-search-mini-model-v2")

sentences = [
    "Bulan apa inflasi sebesar 0,63 persen terjadi pada tahun 2013?",
    "Pada bulan Mei 2013 terjadi inflasi sebesar 0,2 persen",
    "Nilai Tukar Petani (NTP) April 2024 sebesar 116,79 atau turun 2,18 persen.",
    "Posisi Kredit Perbankan<sup>1</sup>dalam Rupiah dan Valuta Asing Menurut Sektor Ekonomi (miliar rupiah), 2016-2018"
]
embeddings = model.encode(sentences)

similarities = model.similarity(embeddings, embeddings)
print(similarities.shape)  # [4, 4]
```
- Notebooks
- Google Colab
- Kaggle
| { | |
| "added_tokens_decoder": { | |
| "0": { | |
| "content": "<s>", | |
| "lstrip": false, | |
| "normalized": false, | |
| "rstrip": false, | |
| "single_word": false, | |
| "special": true | |
| }, | |
| "1": { | |
| "content": "<pad>", | |
| "lstrip": false, | |
| "normalized": false, | |
| "rstrip": false, | |
| "single_word": false, | |
| "special": true | |
| }, | |
| "2": { | |
| "content": "</s>", | |
| "lstrip": false, | |
| "normalized": false, | |
| "rstrip": false, | |
| "single_word": false, | |
| "special": true | |
| }, | |
| "3": { | |
| "content": "<unk>", | |
| "lstrip": false, | |
| "normalized": false, | |
| "rstrip": false, | |
| "single_word": false, | |
| "special": true | |
| }, | |
| "250001": { | |
| "content": "<mask>", | |
| "lstrip": true, | |
| "normalized": false, | |
| "rstrip": false, | |
| "single_word": false, | |
| "special": true | |
| } | |
| }, | |
| "bos_token": "<s>", | |
| "clean_up_tokenization_spaces": false, | |
| "cls_token": "<s>", | |
| "do_lower_case": true, | |
| "eos_token": "</s>", | |
| "extra_special_tokens": {}, | |
| "mask_token": "<mask>", | |
| "max_length": 128, | |
| "model_max_length": 128, | |
| "pad_to_multiple_of": null, | |
| "pad_token": "<pad>", | |
| "pad_token_type_id": 0, | |
| "padding_side": "right", | |
| "sep_token": "</s>", | |
| "stride": 0, | |
| "strip_accents": null, | |
| "tokenize_chinese_chars": true, | |
| "tokenizer_class": "BertTokenizer", | |
| "truncation_side": "right", | |
| "truncation_strategy": "longest_first", | |
| "unk_token": "<unk>" | |
| } | |