Upload folder using huggingface_hub
Browse files
- README.md +6 -6
- config.json +1 -1
- mergekit_config.yml +2 -2
- model-00001-of-00006.safetensors +1 -1
- model-00002-of-00006.safetensors +1 -1
- model-00003-of-00006.safetensors +1 -1
- model-00004-of-00006.safetensors +1 -1
- model-00005-of-00006.safetensors +1 -1
- model-00006-of-00006.safetensors +1 -1
README.md
CHANGED
|
@@ -1,7 +1,7 @@
|
|
| 1 |
---
|
| 2 |
base_model:
|
| 3 |
-
- jetuned/
|
| 4 |
-
-
|
| 5 |
library_name: transformers
|
| 6 |
tags:
|
| 7 |
- mergekit
|
|
@@ -15,12 +15,12 @@ This is a merge of pre-trained language models created using [mergekit](https://
|
|
| 15 |
## Merge Details
|
| 16 |
### Merge Method
|
| 17 |
|
| 18 |
-
This model was merged using the [DELLA](https://arxiv.org/abs/2406.11617) merge method using [jetuned/
|
| 19 |
|
| 20 |
### Models Merged
|
| 21 |
|
| 22 |
The following models were included in the merge:
|
| 23 |
-
* [
|
| 24 |
|
| 25 |
### Configuration
|
| 26 |
|
|
@@ -28,13 +28,13 @@ The following YAML configuration was used to produce this model:
|
|
| 28 |
|
| 29 |
```yaml
|
| 30 |
models:
|
| 31 |
-
- model:
|
| 32 |
parameters:
|
| 33 |
density: 1
|
| 34 |
weight: 1
|
| 35 |
lambda: 0.9
|
| 36 |
merge_method: della
|
| 37 |
-
base_model: jetuned/
|
| 38 |
parameters:
|
| 39 |
density: 1
|
| 40 |
weight: 1
|
|
|
|
| 1 |
---
|
| 2 |
base_model:
|
| 3 |
+
- jetuned/CosmoCoder
|
| 4 |
+
- Tesslate/Tessa-T1-14B
|
| 5 |
library_name: transformers
|
| 6 |
tags:
|
| 7 |
- mergekit
|
|
|
|
| 15 |
## Merge Details
|
| 16 |
### Merge Method
|
| 17 |
|
| 18 |
+
This model was merged using the [DELLA](https://arxiv.org/abs/2406.11617) merge method using [jetuned/CosmoCoder](https://huggingface.co/jetuned/CosmoCoder) as a base.
|
| 19 |
|
| 20 |
### Models Merged
|
| 21 |
|
| 22 |
The following models were included in the merge:
|
| 23 |
+
* [Tesslate/Tessa-T1-14B](https://huggingface.co/Tesslate/Tessa-T1-14B)
|
| 24 |
|
| 25 |
### Configuration
|
| 26 |
|
|
|
|
| 28 |
|
| 29 |
```yaml
|
| 30 |
models:
|
| 31 |
+
- model: Tesslate/Tessa-T1-14B
|
| 32 |
parameters:
|
| 33 |
density: 1
|
| 34 |
weight: 1
|
| 35 |
lambda: 0.9
|
| 36 |
merge_method: della
|
| 37 |
+
base_model: jetuned/CosmoCoder
|
| 38 |
parameters:
|
| 39 |
density: 1
|
| 40 |
weight: 1
|
config.json
CHANGED
|
@@ -1,5 +1,5 @@
|
|
| 1 |
{
|
| 2 |
-
"_name_or_path": "jetuned/
|
| 3 |
"architectures": [
|
| 4 |
"Qwen2ForCausalLM"
|
| 5 |
],
|
|
|
|
| 1 |
{
|
| 2 |
+
"_name_or_path": "jetuned/CosmoCoder",
|
| 3 |
"architectures": [
|
| 4 |
"Qwen2ForCausalLM"
|
| 5 |
],
|
mergekit_config.yml
CHANGED
|
@@ -1,11 +1,11 @@
|
|
| 1 |
models:
|
| 2 |
-
- model:
|
| 3 |
parameters:
|
| 4 |
density: 1
|
| 5 |
weight: 1
|
| 6 |
lambda: 0.9
|
| 7 |
merge_method: della
|
| 8 |
-
base_model: jetuned/
|
| 9 |
parameters:
|
| 10 |
density: 1
|
| 11 |
weight: 1
|
|
|
|
| 1 |
models:
|
| 2 |
+
- model: Tesslate/Tessa-T1-14B
|
| 3 |
parameters:
|
| 4 |
density: 1
|
| 5 |
weight: 1
|
| 6 |
lambda: 0.9
|
| 7 |
merge_method: della
|
| 8 |
+
base_model: jetuned/CosmoCoder
|
| 9 |
parameters:
|
| 10 |
density: 1
|
| 11 |
weight: 1
|
model-00001-of-00006.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4899283400
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cbb82355a8da6d18d89a30b8dd38c8d72a78423d0b117599962d73a8aeb2b926
|
| 3 |
size 4899283400
|
model-00002-of-00006.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4954847280
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c34e5f657ae34ae8949e43e46a00b46679a4495aae34abd9f23d52b0a4d65dc5
|
| 3 |
size 4954847280
|
model-00003-of-00006.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4954847272
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0ee694191d8fd5c08c707d6beca64a525a8415484d1c006bb5c6544255100821
|
| 3 |
size 4954847272
|
model-00004-of-00006.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4954847272
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ee44139b5658d6dcb3221032e2238d0298f39fa5d4a56f6e100d7e38e5bd37cc
|
| 3 |
size 4954847272
|
model-00005-of-00006.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4954847272
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:707600b8b0bcd29fc09275b3dc2639c5ecc7f76636e639bccbc9c2d098a8dfb4
|
| 3 |
size 4954847272
|
model-00006-of-00006.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4813289328
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1d24caf532fb9c28f088197640ee2db5de425f63b506f512d6c4f9f97a44b173
|
| 3 |
size 4813289328
|