ia-espirita committed on
Commit
0454832
·
verified ·
1 Parent(s): d99ffb3

Upload model trained with Unsloth

Browse files

Upload model trained with Unsloth 2x faster

Files changed (3) hide show
  1. README.md +18 -17
  2. adapter_config.json +50 -0
  3. adapter_model.safetensors +3 -0
README.md CHANGED
@@ -1,28 +1,29 @@
1
  ---
2
  language:
3
- - pt
4
  license: apache-2.0
5
  tags:
6
- - spiritism
7
- - kardec
8
- - espiritismo
9
- - allan-kardec
10
- - religion
11
- - portuguese
12
- - brazilian
13
- - fine-tuned
14
- - qlora
15
- - llama-3
16
- - spirituality
17
- - riv-ai
18
- - espírita
 
19
  datasets:
20
- - ia-espirita/riv-ai-dataset
21
  base_model: meta-llama/Meta-Llama-3-8B-Instruct
22
  pipeline_tag: text-generation
23
  model-index:
24
- - name: riv-ai
25
- results: []
26
  ---
27
 
28
  # 🔮 RIV AI — Modelo de IA Espírita Open Source
 
1
  ---
2
  language:
3
+ - pt
4
  license: apache-2.0
5
  tags:
6
+ - spiritism
7
+ - kardec
8
+ - espiritismo
9
+ - allan-kardec
10
+ - religion
11
+ - portuguese
12
+ - brazilian
13
+ - fine-tuned
14
+ - qlora
15
+ - llama-3
16
+ - spirituality
17
+ - riv-ai
18
+ - espírita
19
+ - unsloth
20
  datasets:
21
+ - ia-espirita/riv-ai-dataset
22
  base_model: meta-llama/Meta-Llama-3-8B-Instruct
23
  pipeline_tag: text-generation
24
  model-index:
25
+ - name: riv-ai
26
+ results: []
27
  ---
28
 
29
  # 🔮 RIV AI — Modelo de IA Espírita Open Source
adapter_config.json ADDED
@@ -0,0 +1,50 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "alora_invocation_tokens": null,
3
+ "alpha_pattern": {},
4
+ "arrow_config": null,
5
+ "auto_mapping": {
6
+ "base_model_class": "LlamaForCausalLM",
7
+ "parent_library": "transformers.models.llama.modeling_llama",
8
+ "unsloth_fixed": true
9
+ },
10
+ "base_model_name_or_path": "unsloth/meta-llama-3.1-8b-instruct-unsloth-bnb-4bit",
11
+ "bias": "none",
12
+ "corda_config": null,
13
+ "ensure_weight_tying": false,
14
+ "eva_config": null,
15
+ "exclude_modules": null,
16
+ "fan_in_fan_out": false,
17
+ "inference_mode": true,
18
+ "init_lora_weights": true,
19
+ "layer_replication": null,
20
+ "layers_pattern": null,
21
+ "layers_to_transform": null,
22
+ "loftq_config": {},
23
+ "lora_alpha": 32,
24
+ "lora_bias": false,
25
+ "lora_dropout": 0,
26
+ "megatron_config": null,
27
+ "megatron_core": "megatron.core",
28
+ "modules_to_save": null,
29
+ "peft_type": "LORA",
30
+ "peft_version": "0.18.1",
31
+ "qalora_group_size": 16,
32
+ "r": 16,
33
+ "rank_pattern": {},
34
+ "revision": null,
35
+ "target_modules": [
36
+ "o_proj",
37
+ "up_proj",
38
+ "q_proj",
39
+ "down_proj",
40
+ "v_proj",
41
+ "gate_proj",
42
+ "k_proj"
43
+ ],
44
+ "target_parameters": null,
45
+ "task_type": "CAUSAL_LM",
46
+ "trainable_token_indices": null,
47
+ "use_dora": false,
48
+ "use_qalora": false,
49
+ "use_rslora": false
50
+ }
adapter_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:430a1cfe022285dcbc5d7e50f3508dda11fa5b40c1feebc9f207414935112c5d
3
+ size 167832240