pere committed on
Commit
ca95bbe
·
1 Parent(s): 08de38c
config.json CHANGED
@@ -1,12 +1,15 @@
1
  {
2
- "_name_or_path": "meta-llama/Llama-3.1-70B",
3
  "architectures": [
4
  "LlamaForCausalLM"
5
  ],
6
  "attention_bias": false,
7
  "attention_dropout": 0.0,
8
  "bos_token_id": 128000,
9
- "eos_token_id": 128001,
 
 
 
 
10
  "head_dim": 128,
11
  "hidden_act": "silu",
12
  "hidden_size": 8192,
@@ -29,8 +32,8 @@
29
  },
30
  "rope_theta": 500000.0,
31
  "tie_word_embeddings": false,
32
- "torch_dtype": "float32",
33
- "transformers_version": "4.46.3",
34
  "use_cache": true,
35
  "vocab_size": 128256
36
  }
 
1
  {
 
2
  "architectures": [
3
  "LlamaForCausalLM"
4
  ],
5
  "attention_bias": false,
6
  "attention_dropout": 0.0,
7
  "bos_token_id": 128000,
8
+ "eos_token_id": [
9
+ 128001,
10
+ 128008,
11
+ 128009
12
+ ],
13
  "head_dim": 128,
14
  "hidden_act": "silu",
15
  "hidden_size": 8192,
 
32
  },
33
  "rope_theta": 500000.0,
34
  "tie_word_embeddings": false,
35
+ "torch_dtype": "bfloat16",
36
+ "transformers_version": "4.53.3",
37
  "use_cache": true,
38
  "vocab_size": 128256
39
  }
generation_config.json CHANGED
@@ -1,9 +1,10 @@
1
  {
2
  "_from_model_config": true,
3
  "bos_token_id": 128000,
4
- "do_sample": true,
5
- "eos_token_id": 128001,
6
- "temperature": 0.6,
7
- "top_p": 0.9,
8
- "transformers_version": "4.46.3"
 
9
  }
 
1
  {
2
  "_from_model_config": true,
3
  "bos_token_id": 128000,
4
+ "eos_token_id": [
5
+ 128001,
6
+ 128008,
7
+ 128009
8
+ ],
9
+ "transformers_version": "4.53.3"
10
  }
model-00001-of-00030.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:baac216ab63c1f706aca9d262a80b17177d58aacd491277fc0df40500cd2646e
3
- size 4584408792
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:91c1b1bc95d19a4c3ee5f7b1f5e7cca098a9600ffd7b9cb4d38fc249df2807d7
3
+ size 4584408808
model-00002-of-00030.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5cce802c6a4057210004e74851a08cb1f934fa0d54d2bc097ed3d589ba197461
3
- size 4664167352
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f6dcea70a6ef74e633a821d2f6db12436c6dabeb3fe87a3719b52a2e33ccb214
3
+ size 4664167376
model-00003-of-00030.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:65c8e99d496f5a0cb10bf139456f08049c0c4fc328b2c82b066704c3651a5ce9
3
- size 4999711672
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e266279a8f8f4760c82bcb32f20ffddfd213345ca5f8701227d4e8766aeda3b8
3
+ size 4999711704
model-00004-of-00030.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:48fff05a994229772faaf742604f3c799ba75c7993b17138503db6ffe7e83b8e
3
- size 4966157008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b128d781558dedfa0d6b45af8d341cbb6803ef0f29d6e1c36d54ec5c21d42f5f
3
+ size 4966157032
model-00005-of-00030.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8efdaa793b687a9aa0a237d2d2914bcb661ccf19bc64f8559de54cc6d39585a9
3
- size 4664134384
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:176fb5cb050fcaaca57278f97975199dcdfff76aeb733b0528afbdd58d76b2e1
3
+ size 4664134408
model-00006-of-00030.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:441433ca374d68b25b7c594fbdeffa2ce4816bb6155cdd5b4e69b0d6670ee8e1
3
- size 4664167384
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8ab56f6be33c7d9d80bd137a38e4185f7306973d41982742e59bd30fd1cbe0e8
3
+ size 4664167408
model-00007-of-00030.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1dd6af77c7f49b833fce8894fbf6d25d1fae9fd69d6308d8e052aa5e66bca093
3
- size 4664167376
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c1f00b9f24f9ed096cead200d94d28ef43575c8c892db88cc1f3fa4ff7bb70f8
3
+ size 4664167408
model-00008-of-00030.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:477d234c3cd7ce0ca73fc74b7ac47aad17fe913ac9a5fcc36a5b21d07df26561
3
- size 4999711704
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8ff39bfd1a4e3b5eed0b6d4ddeb0a318269469aaf4f3851ee6901128279bca59
3
+ size 4999711728
model-00009-of-00030.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f054c1ae7b4546defd88df59f7b21076024be0a1cc368b2b4cd1485fd4c1b3de
3
- size 4966157032
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fc8f9e0814db58e41fade49b50d6e8372c17942b03a2db08cad9bc0dc9499a95
3
+ size 4966157056
model-00010-of-00030.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:33236b46bd60270177bc2bc4ee8a68a4831e9aeac42cc2add77e75620dbd2c07
3
- size 4664134384
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b4a6fd29a53b031db32e22beb77ce19a990fffa6effba7237479aa06f2e6423f
3
+ size 4664134408
model-00011-of-00030.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:236d301a13925bd65658f1df310ffbeaa7d55ded417869bb2997ec34c9fb0dac
3
- size 4664167384
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:83a73740d92a90c36b4cf6a36cc0300e970ce8dede225cd3ef2c1af353ea9dc1
3
+ size 4664167408
model-00012-of-00030.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:578ef82e273c07c77a4fe30d65a2a19b60b2b89ba1c0532f5084744c4a8ede02
3
- size 4664167376
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e80efa1b2b5939e013780e9a9d4bedc51a6207c6726fec46dc60c92ebdba3388
3
+ size 4664167408
model-00013-of-00030.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d9183f02f326a86b18926f77e2409f62947b2dd88689d6f7e1f6553eae5896aa
3
- size 4999711704
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ec46d2630148a753e997b267b53cbfac52fb1f7f170dcf23fbeb530f7f286ea3
3
+ size 4999711728
model-00014-of-00030.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ca95799d8a13e942840368cd8882d0c2eda3710ce3834cee4e0f9ede950cd9a1
3
- size 4966157032
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:81f3c3979dc5a7fc2b87d9ed9e1ab5bf45220cc5068046dc13d8bcde79cc55d5
3
+ size 4966157056
model-00015-of-00030.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4670473180288055aa60d76a0de486396ba474c6ae200c731f2169ff654cb410
3
- size 4664134384
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:603e93c3d4bef2cb4d070252d11c484c9451e29a75ab1c5c3ca9f087c1919396
3
+ size 4664134408
model-00016-of-00030.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:aad6ce03d0255a33f6d93097987ae674214c534d644998f1fb4498bf0fcf3820
3
- size 4664167384
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f5aa330bf094026c8f6ce14e5c97aaf12cd944b5fc93062a124d73c7564617a6
3
+ size 4664167408
model-00017-of-00030.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1ad09d02f449ed05eab0a5775eee1ead693fff2c2667d8c8fc01c3eb5ef9d97a
3
- size 4664167376
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0e23a2dcac37a6e26c96211cf071d3fd5bd4bcca8cb495e7db4fff6fce4b9811
3
+ size 4664167408
model-00018-of-00030.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a7e75c9e2cf4fadf1d74502b59f0c8475fd77555a43d97ea23e3f896d8fe27dd
3
- size 4999711704
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7f10e2a75d9133c56bd32f0a96c23bfc738a49d33df159c21570ee70d959ad77
3
+ size 4999711728
model-00019-of-00030.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bef9c0d817c1a0a006de45690bafc24e06300fa0326dd1b3855f40cbb34e0f71
3
- size 4966157032
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:619c1ac3a5c0bb166585801ae8358e9f9a1924b992d6c0f41e2c2d6cd1e76d21
3
+ size 4966157056
model-00020-of-00030.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:deadf82046a643b8a6660b3d3759b24d02b5b2bb076139caa1073f14f963bf4a
3
- size 4664134384
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9f052a16e9321d9c563c0059d5a01ef7384c84b30edc76a89b5e59dfce1ef0dd
3
+ size 4664134408
model-00021-of-00030.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:53e4f081c7d99651cdc2e2525fb14eba42d19f57e593d5aef4b4856402e80de4
3
- size 4664167384
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ea1b7f2c13cdaa9d04f370df58f1edda29ecfb7496cd05a0f1ad0923745ae7c1
3
+ size 4664167408
model-00022-of-00030.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:00ec762ca92badeec1a588d3e15a99d7f6dcc304919397dd78376c042e0d7a18
3
- size 4664167376
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:773b03635f38418b027f068fa162790ae62cde3267b397f62b7392740e787948
3
+ size 4664167408
model-00023-of-00030.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:06aa71a3eba3efc73dbaa30feb1fd7926710b8414e95e6652503de09871a22bf
3
- size 4999711704
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5993527e1dd735c0da5fe7687f8fcd6ddd7cc7a51ea459b8d637c39f86637434
3
+ size 4999711728
model-00024-of-00030.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:47fe8139976f2ea1a75a5380f8e9cb89e04a1ab82d0fe2b71903231af5ca16ca
3
- size 4966157032
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fc177516a3b06b4b63a34e56e3342ee1c939f38e107f2fea9cc355f33f96b4f4
3
+ size 4966157056
model-00025-of-00030.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:13fbaf9fedeb530a6b905d317a8aa5016a33acddd9aa7860f578fd989eb37a8d
3
- size 4664134384
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aa569ed5c8a605fbfe239f087379b1e4630fde9657de2ef231f8a9fdf15e2cf3
3
+ size 4664134408
model-00026-of-00030.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:af4fef67f3aa6b822428d607e25595c733558c67b6f0988267669884624d79b1
3
- size 4664167384
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0e90307865422293a504835f6acfc95d026c9f8138551930ced245b069869975
3
+ size 4664167408
model-00027-of-00030.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b26667beb4b073534384b018fbdece596a8f46e9930e8514f6613fbb3457a267
3
- size 4664167376
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:de43f48b65ad52513625a5187e69c1b92c72aee838642fc1f87ba661415e2e9f
3
+ size 4664167408
model-00028-of-00030.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dbc8562a99f7757d2533115870728d412e887d4c3b71356a6a2b5b325105e395
3
- size 4999711704
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b079e8bc2dc220228b36bf62b6032303b0cd310b23f84dd26083be80fd504fec
3
+ size 4999711728
model-00029-of-00030.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:076c0423c5be3cde85c9c7bbb0a91e0fc43273b734ec8c0df4bf4dedd438b82c
3
- size 4966157032
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fdaf68c948e9cde93c4ad11179dc51f29df9fa3774bc8d06b79750730427537d
3
+ size 4966157056
model-00030-of-00030.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e4db3e7db2757a18ccd860632652f72d893749e14604f4271c600de352d11220
3
- size 2101362904
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:958154a0f5250be9c7243ab9b860d286ca31202a90839b16f6809376ed679b9f
3
+ size 2101362912
model.safetensors.index.json CHANGED
@@ -1,5 +1,6 @@
1
  {
2
  "metadata": {
 
3
  "total_size": 141107412992
4
  },
5
  "weight_map": {
 
1
  {
2
  "metadata": {
3
+ "total_parameters": 70553706496,
4
  "total_size": 141107412992
5
  },
6
  "weight_map": {
tokenizer.json CHANGED
@@ -410560,4 +410560,4 @@
410560
  "éĶ ¦"
410561
  ]
410562
  }
410563
- }
 
410560
  "éĶ ¦"
410561
  ]
410562
  }
410563
+ }
tokenizer_config.json CHANGED
@@ -2050,8 +2050,9 @@
2050
  }
2051
  },
2052
  "bos_token": "<|begin_of_text|>",
 
2053
  "clean_up_tokenization_spaces": true,
2054
- "eos_token": "<|end_of_text|>",
2055
  "model_input_names": [
2056
  "input_ids",
2057
  "attention_mask"
 
2050
  }
2051
  },
2052
  "bos_token": "<|begin_of_text|>",
2053
+ "chat_template": "{{- bos_token }}\n{%- if custom_tools is defined %}\n {%- set tools = custom_tools %}\n{%- endif %}\n{%- if not tools_in_user_message is defined %}\n {%- set tools_in_user_message = true %}\n{%- endif %}\n{%- if not date_string is defined %}\n {%- if strftime_now is defined %}\n {%- set date_string = strftime_now(\"%d %b %Y\") %}\n {%- else %}\n {%- set date_string = \"26 Jul 2024\" %}\n {%- endif %}\n{%- endif %}\n{%- if not tools is defined %}\n {%- set tools = none %}\n{%- endif %}\n\n{#- This block extracts the system message, so we can slot it into the right place. #}\n{%- if messages[0]['role'] == 'system' %}\n {%- set system_message = messages[0]['content']|trim %}\n {%- set messages = messages[1:] %}\n{%- else %}\n {%- set system_message = \"\" %}\n{%- endif %}\n\n{#- System message #}\n{{- \"<|start_header_id|>system<|end_header_id|>\\n\\n\" }}\n{%- if tools is not none %}\n {{- \"Environment: ipython\\n\" }}\n{%- endif %}\n{{- \"Cutting Knowledge Date: December 2023\\n\" }}\n{{- \"Today Date: \" + date_string + \"\\n\\n\" }}\n{%- if tools is not none and not tools_in_user_message %}\n {{- \"You have access to the following functions. To call a function, please respond with JSON for a function call.\" }}\n {{- 'Respond in the format {\"name\": function name, \"parameters\": dictionary of argument name and its value}.' 
}}\n {{- \"Do not use variables.\\n\\n\" }}\n {%- for t in tools %}\n {{- t | tojson(indent=4) }}\n {{- \"\\n\\n\" }}\n {%- endfor %}\n{%- endif %}\n{{- system_message }}\n{{- \"<|eot_id|>\" }}\n\n{#- Custom tools are passed in a user message with some extra guidance #}\n{%- if tools_in_user_message and not tools is none %}\n {#- Extract the first user message so we can plug it in here #}\n {%- if messages | length != 0 %}\n {%- set first_user_message = messages[0]['content']|trim %}\n {%- set messages = messages[1:] %}\n {%- else %}\n {{- raise_exception(\"Cannot put tools in the first user message when there's no first user message!\") }}\n{%- endif %}\n {{- '<|start_header_id|>user<|end_header_id|>\\n\\n' -}}\n {{- \"Given the following functions, please respond with a JSON for a function call \" }}\n {{- \"with its proper arguments that best answers the given prompt.\\n\\n\" }}\n {{- 'Respond in the format {\"name\": function name, \"parameters\": dictionary of argument name and its value}.' 
}}\n {{- \"Do not use variables.\\n\\n\" }}\n {%- for t in tools %}\n {{- t | tojson(indent=4) }}\n {{- \"\\n\\n\" }}\n {%- endfor %}\n {{- first_user_message + \"<|eot_id|>\"}}\n{%- endif %}\n\n{%- for message in messages %}\n {%- if not (message.role == 'ipython' or message.role == 'tool' or 'tool_calls' in message) %}\n {{- '<|start_header_id|>' + message['role'] + '<|end_header_id|>\\n\\n'+ message['content'] | trim + '<|eot_id|>' }}\n {%- elif 'tool_calls' in message %}\n {%- if not message.tool_calls|length == 1 %}\n {{- raise_exception(\"This model only supports single tool-calls at once!\") }}\n {%- endif %}\n {%- set tool_call = message.tool_calls[0].function %}\n {{- '<|start_header_id|>assistant<|end_header_id|>\\n\\n' -}}\n {{- '{\"name\": \"' + tool_call.name + '\", ' }}\n {{- '\"parameters\": ' }}\n {{- tool_call.arguments | tojson }}\n {{- \"}\" }}\n {{- \"<|eot_id|>\" }}\n {%- elif message.role == \"tool\" or message.role == \"ipython\" %}\n {{- \"<|start_header_id|>ipython<|end_header_id|>\\n\\n\" }}\n {%- if message.content is mapping or message.content is iterable %}\n {{- message.content | tojson }}\n {%- else %}\n {{- message.content }}\n {%- endif %}\n {{- \"<|eot_id|>\" }}\n {%- endif %}\n{%- endfor %}\n{%- if add_generation_prompt %}\n {{- '<|start_header_id|>assistant<|end_header_id|>\\n\\n' }}\n{%- endif %}\n",
2054
  "clean_up_tokenization_spaces": true,
2055
+ "eos_token": "<|eot_id|>",
2056
  "model_input_names": [
2057
  "input_ids",
2058
  "attention_mask"