lmassaron committed on
Commit
38cb939
·
verified ·
1 Parent(s): 33813b0

lmassaron/gemma-3-1B-it-function_calling

Browse files
README.md CHANGED
@@ -34,10 +34,10 @@ This model was trained with SFT.
34
 
35
  ### Framework versions
36
 
37
- - TRL: 0.16.0
38
- - Transformers: 4.50.1
39
  - Pytorch: 2.6.0+cu124
40
- - Datasets: 3.4.1
41
  - Tokenizers: 0.21.1
42
 
43
  ## Citations
@@ -49,7 +49,7 @@ Cite TRL as:
49
  ```bibtex
50
  @misc{vonwerra2022trl,
51
  title = {{TRL: Transformer Reinforcement Learning}},
52
- author = {Leandro von Werra and Younes Belkada and Lewis Tunstall and Edward Beeching and Tristan Thrush and Nathan Lambert and Shengyi Huang and Kashif Rasul and Quentin Gallouédec},
53
  year = 2020,
54
  journal = {GitHub repository},
55
  publisher = {GitHub},
 
34
 
35
  ### Framework versions
36
 
37
+ - TRL: 0.17.0
38
+ - Transformers: 4.51.3
39
  - Pytorch: 2.6.0+cu124
40
+ - Datasets: 3.6.0
41
  - Tokenizers: 0.21.1
42
 
43
  ## Citations
 
49
  ```bibtex
50
  @misc{vonwerra2022trl,
51
  title = {{TRL: Transformer Reinforcement Learning}},
52
+ author = {Leandro von Werra and Younes Belkada and Lewis Tunstall and Edward Beeching and Tristan Thrush and Nathan Lambert and Shengyi Huang and Kashif Rasul and Quentin Gallou{\'e}dec},
53
  year = 2020,
54
  journal = {GitHub repository},
55
  publisher = {GitHub},
adapter_config.json CHANGED
@@ -24,15 +24,15 @@
24
  "rank_pattern": {},
25
  "revision": null,
26
  "target_modules": [
 
 
 
 
27
  "lm_head",
 
28
  "q_proj",
29
  "up_proj",
30
- "v_proj",
31
- "embed_tokens",
32
- "gate_proj",
33
- "o_proj",
34
- "down_proj",
35
- "k_proj"
36
  ],
37
  "task_type": "CAUSAL_LM",
38
  "trainable_token_indices": null,
 
24
  "rank_pattern": {},
25
  "revision": null,
26
  "target_modules": [
27
+ "k_proj",
28
+ "o_proj",
29
+ "embed_tokens",
30
+ "down_proj",
31
  "lm_head",
32
+ "gate_proj",
33
  "q_proj",
34
  "up_proj",
35
+ "v_proj"
 
 
 
 
 
36
  ],
37
  "task_type": "CAUSAL_LM",
38
  "trainable_token_indices": null,
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e187f5cc6bd7bbe6109db89bab83599b4445213bcfc853f76fd4cd2244064131
3
  size 1293936232
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f5566bbb2855ca6935130a63d1ec7fc6804307891084ae08050201fb19a7d2fb
3
  size 1293936232
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:04bc29295560b97912b7adb4cf1f939d52985bfe392feda937699f9f3e878f6f
3
- size 5624
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:08cfde619b67b4ed75a2fabf6a957f8c566fbaa6d42993c00ee1c1094e2d5c08
3
+ size 5688