Skip to content

Commit

Permalink
retrained models to fix bug in original training
Browse files Browse the repository at this point in the history
  • Loading branch information
vanbujm committed Sep 27, 2024
1 parent 4d9917b commit 3cb2bc3
Show file tree
Hide file tree
Showing 16 changed files with 31 additions and 53 deletions.
6 changes: 5 additions & 1 deletion src/trian/train_cai.py
Original file line number Diff line number Diff line change
Expand Up @@ -141,4 +141,8 @@ def formatting_func(example):

trainer.train()

-trainer.save_model("./ultrachat_baseline")
+trainer.save_model("./ultrachat_cai")
+
+trainer.push_to_hub("vanbujm/ultrachat_cai")
+tokenizer.push_to_hub("vanbujm/ultrachat_cai")

3 changes: 2 additions & 1 deletion ultrachat_baseline/README.md
Original file line number Diff line number Diff line change
@@ -1,6 +1,7 @@
---
library_name: transformers
-tags: []
+tags:
+- unsloth
---

# Model Card for Model ID
Expand Down
8 changes: 4 additions & 4 deletions ultrachat_baseline/adapter_config.json
Original file line number Diff line number Diff line change
Expand Up @@ -20,13 +20,13 @@
"rank_pattern": {},
"revision": null,
"target_modules": [
"v_proj",
"down_proj",
"up_proj",
"o_proj",
"k_proj",
"up_proj",
"q_proj",
"gate_proj"
"gate_proj",
"down_proj",
"v_proj"
],
"task_type": "CAUSAL_LM",
"use_dora": false,
Expand Down
4 changes: 2 additions & 2 deletions ultrachat_baseline/adapter_model.safetensors
Git LFS file not shown
8 changes: 1 addition & 7 deletions ultrachat_baseline/special_tokens_map.json
Original file line number Diff line number Diff line change
Expand Up @@ -13,13 +13,7 @@
"rstrip": false,
"single_word": false
},
-"pad_token": {
-"content": "</s>",
-"lstrip": false,
-"normalized": false,
-"rstrip": false,
-"single_word": false
-},
+"pad_token": "<unk>",
"unk_token": {
"content": "<unk>",
"lstrip": false,
Expand Down
7 changes: 1 addition & 6 deletions ultrachat_baseline/tokenizer.json
Original file line number Diff line number Diff line change
@@ -1,11 +1,6 @@
{
"version": "1.0",
-"truncation": {
-"direction": "Right",
-"max_length": 4096,
-"strategy": "LongestFirst",
-"stride": 0
-},
+"truncation": null,
"padding": null,
"added_tokens": [
{
Expand Down
Binary file added ultrachat_baseline/tokenizer.model
Binary file not shown.
9 changes: 3 additions & 6 deletions ultrachat_baseline/tokenizer_config.json
Original file line number Diff line number Diff line change
Expand Up @@ -34,15 +34,12 @@
"clean_up_tokenization_spaces": false,
"eos_token": "</s>",
"legacy": false,
"max_length": 4096,
"model_max_length": 1000000000000000019884624838656,
"pad_token": "</s>",
"model_max_length": 32768,
"pad_token": "<unk>",
"padding_side": "right",
"sp_model_kwargs": {},
"spaces_between_special_tokens": false,
"stride": 0,
"tokenizer_class": "LlamaTokenizer",
"truncation_side": "right",
"truncation_strategy": "longest_first",
"unk_token": "<unk>",
"use_default_system_prompt": false
}
Binary file modified ultrachat_baseline/training_args.bin
Binary file not shown.
3 changes: 2 additions & 1 deletion ultrachat_cai/README.md
Original file line number Diff line number Diff line change
@@ -1,6 +1,7 @@
---
library_name: transformers
-tags: []
+tags:
+- unsloth
---

# Model Card for Model ID
Expand Down
8 changes: 4 additions & 4 deletions ultrachat_cai/adapter_config.json
Original file line number Diff line number Diff line change
Expand Up @@ -20,13 +20,13 @@
"rank_pattern": {},
"revision": null,
"target_modules": [
"v_proj",
"down_proj",
"gate_proj",
"q_proj",
"k_proj",
"q_proj",
"o_proj",
"up_proj",
"v_proj",
"o_proj"
"gate_proj"
],
"task_type": "CAUSAL_LM",
"use_dora": false,
Expand Down
4 changes: 2 additions & 2 deletions ultrachat_cai/adapter_model.safetensors
Git LFS file not shown
8 changes: 1 addition & 7 deletions ultrachat_cai/special_tokens_map.json
Original file line number Diff line number Diff line change
Expand Up @@ -13,13 +13,7 @@
"rstrip": false,
"single_word": false
},
-"pad_token": {
-"content": "</s>",
-"lstrip": false,
-"normalized": false,
-"rstrip": false,
-"single_word": false
-},
+"pad_token": "<unk>",
"unk_token": {
"content": "<unk>",
"lstrip": false,
Expand Down
7 changes: 1 addition & 6 deletions ultrachat_cai/tokenizer.json
Original file line number Diff line number Diff line change
@@ -1,11 +1,6 @@
{
"version": "1.0",
-"truncation": {
-"direction": "Right",
-"max_length": 4096,
-"strategy": "LongestFirst",
-"stride": 0
-},
+"truncation": null,
"padding": null,
"added_tokens": [
{
Expand Down
9 changes: 3 additions & 6 deletions ultrachat_cai/tokenizer_config.json
Original file line number Diff line number Diff line change
Expand Up @@ -34,15 +34,12 @@
"clean_up_tokenization_spaces": false,
"eos_token": "</s>",
"legacy": false,
"max_length": 4096,
"model_max_length": 1000000000000000019884624838656,
"pad_token": "</s>",
"model_max_length": 32768,
"pad_token": "<unk>",
"padding_side": "right",
"sp_model_kwargs": {},
"spaces_between_special_tokens": false,
"stride": 0,
"tokenizer_class": "LlamaTokenizer",
"truncation_side": "right",
"truncation_strategy": "longest_first",
"unk_token": "<unk>",
"use_default_system_prompt": false
}
Binary file modified ultrachat_cai/training_args.bin
Binary file not shown.

0 comments on commit 3cb2bc3

Please sign in to comment.