Text Generation
Transformers
PyTorch
Safetensors
Chinese
English
kclgpt
codeshell
wisdomshell
pku-kcl
openbankai
custom_code
Instructions for using WisdomShell/CodeShell-7B with libraries, inference providers, notebooks, and local apps. Follow the links below to get started.
- Libraries
- Transformers
How to use WisdomShell/CodeShell-7B with Transformers:
```python
# Use a pipeline as a high-level helper
from transformers import pipeline

pipe = pipeline("text-generation", model="WisdomShell/CodeShell-7B", trust_remote_code=True)

# Load model directly
from transformers import AutoModelForCausalLM

model = AutoModelForCausalLM.from_pretrained("WisdomShell/CodeShell-7B", trust_remote_code=True, dtype="auto")
```
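Once the model is loaded, generation follows the standard Transformers API. The sketch below is illustrative rather than taken from the model card: the prompt, the generation settings, and the use of `device_map="auto"` (which needs `accelerate` installed) are assumptions.

```python
# Minimal completion sketch; prompt and generation settings are illustrative.
from transformers import AutoModelForCausalLM, AutoTokenizer

model_id = "WisdomShell/CodeShell-7B"
tokenizer = AutoTokenizer.from_pretrained(model_id, trust_remote_code=True)
model = AutoModelForCausalLM.from_pretrained(
    model_id,
    trust_remote_code=True,
    dtype="auto",
    device_map="auto",  # requires `accelerate`; drop it to load on a single device
)

# CodeShell is a code model, so a code-style prompt is a natural fit.
prompt = "def fibonacci(n):"
inputs = tokenizer(prompt, return_tensors="pt").to(model.device)
outputs = model.generate(**inputs, max_new_tokens=128, do_sample=False)
print(tokenizer.decode(outputs[0], skip_special_tokens=True))
```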
- Notebooks
- Google Colab
- Kaggle
- Local Apps
- vLLM
How to use WisdomShell/CodeShell-7B with vLLM:
Install from pip and serve the model
```bash
# Install vLLM from pip:
pip install vllm

# Start the vLLM server:
vllm serve "WisdomShell/CodeShell-7B"

# Call the server using curl (OpenAI-compatible API):
curl -X POST "http://localhost:8000/v1/completions" \
  -H "Content-Type: application/json" \
  --data '{
    "model": "WisdomShell/CodeShell-7B",
    "prompt": "Once upon a time,",
    "max_tokens": 512,
    "temperature": 0.5
  }'
```
Use Docker
```bash
docker model run hf.co/WisdomShell/CodeShell-7B
```
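Because the vLLM server is OpenAI-compatible, the curl call above can also be made from Python with the `openai` client. A minimal sketch, assuming `pip install openai` and a locally running server (point `base_url` at port 30000 instead for the SGLang server shown below); the prompt and the placeholder API key are illustrative.

```python
# Query a locally running OpenAI-compatible server (vLLM shown; change the port for SGLang).
from openai import OpenAI

client = OpenAI(base_url="http://localhost:8000/v1", api_key="EMPTY")  # local servers ignore the key

completion = client.completions.create(
    model="WisdomShell/CodeShell-7B",
    prompt="Once upon a time,",
    max_tokens=512,
    temperature=0.5,
)
print(completion.choices[0].text)
```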
- SGLang
How to use WisdomShell/CodeShell-7B with SGLang:
Install from pip and serve the model
```bash
# Install SGLang from pip:
pip install sglang

# Start the SGLang server:
python3 -m sglang.launch_server \
  --model-path "WisdomShell/CodeShell-7B" \
  --host 0.0.0.0 \
  --port 30000

# Call the server using curl (OpenAI-compatible API):
curl -X POST "http://localhost:30000/v1/completions" \
  -H "Content-Type: application/json" \
  --data '{
    "model": "WisdomShell/CodeShell-7B",
    "prompt": "Once upon a time,",
    "max_tokens": 512,
    "temperature": 0.5
  }'
```
Use Docker images
```bash
docker run --gpus all \
  --shm-size 32g \
  -p 30000:30000 \
  -v ~/.cache/huggingface:/root/.cache/huggingface \
  --env "HF_TOKEN=<secret>" \
  --ipc=host \
  lmsysorg/sglang:latest \
  python3 -m sglang.launch_server \
    --model-path "WisdomShell/CodeShell-7B" \
    --host 0.0.0.0 \
    --port 30000

# Call the server using curl (OpenAI-compatible API):
curl -X POST "http://localhost:30000/v1/completions" \
  -H "Content-Type: application/json" \
  --data '{
    "model": "WisdomShell/CodeShell-7B",
    "prompt": "Once upon a time,",
    "max_tokens": 512,
    "temperature": 0.5
  }'
```
- Docker Model Runner
How to use WisdomShell/CodeShell-7B with Docker Model Runner:
```bash
docker model run hf.co/WisdomShell/CodeShell-7B
```
Upload folder using huggingface_hub
- configuration_codeshell.py +7 -7
- merges.txt +0 -0
- model-00001-of-00002.safetensors +1 -1
- model-00002-of-00002.safetensors +1 -1
- quantizer.py +15 -0
configuration_codeshell.py CHANGED
```diff
@@ -99,11 +99,11 @@ class CodeShellConfig(PretrainedConfig):
     def __init__(
         self,
-        vocab_size=
-        n_positions=
-        n_embd=
-        n_layer=
-        n_head=
+        vocab_size=70144,
+        n_positions=8192,
+        n_embd=4096,
+        n_layer=42,
+        n_head=32,
         n_inner=None,
         activation_function="gelu_pytorch_tanh",
         resid_pdrop=0.1,
@@ -113,8 +113,8 @@ class CodeShellConfig(PretrainedConfig):
         initializer_range=0.02,
         scale_attn_weights=True,
         use_cache=True,
-        bos_token_id=
-        eos_token_id=
+        bos_token_id=70000,
+        eos_token_id=70000,
         attention_softmax_in_fp32=True,
         scale_attention_softmax_in_fp32=True,
         group_query_attention=True,
```
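The new defaults committed above (42 layers, 32 heads, hidden size 4096, 8192 positions, a 70144-token vocabulary, and BOS/EOS id 70000) can be checked against the published configuration without downloading the weights. A small sketch; note that values in the repository's config.json take precedence over these `__init__` defaults if they differ.

```python
# Inspect the published CodeShell configuration (custom code, hence trust_remote_code=True).
from transformers import AutoConfig

config = AutoConfig.from_pretrained("WisdomShell/CodeShell-7B", trust_remote_code=True)
print(config.n_layer, config.n_head, config.n_embd)   # 42, 32, 4096 per the diff above
print(config.vocab_size, config.n_positions)          # 70144, 8192
print(config.bos_token_id, config.eos_token_id)       # 70000, 70000
```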
merges.txt ADDED
The diff for this file is too large to render. See raw diff.
model-00001-of-00002.safetensors CHANGED
```diff
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:
+oid sha256:911eb9034a0be6d4dde83bb2957d89bb0dcf3ad153737e6a58e455f0c05c071a
 size 9955659648
```
model-00002-of-00002.safetensors CHANGED
```diff
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:
+oid sha256:19377de31c1b367d59a3470329b2e1b09ab5eda4f4dafbaba03ed8a4095060a3
 size 5420501688
```
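The LFS pointers above record the expected SHA-256 of each weight shard, so a local copy can be verified after download. A minimal sketch, assuming the shards sit in the current directory (adjust the paths to wherever they were saved):

```python
# Compare downloaded shards against the SHA-256 digests recorded in the LFS pointers above.
import hashlib

def sha256_of(path, chunk_size=1 << 20):
    digest = hashlib.sha256()
    with open(path, "rb") as f:
        for chunk in iter(lambda: f.read(chunk_size), b""):
            digest.update(chunk)
    return digest.hexdigest()

expected = {
    "model-00001-of-00002.safetensors": "911eb9034a0be6d4dde83bb2957d89bb0dcf3ad153737e6a58e455f0c05c071a",
    "model-00002-of-00002.safetensors": "19377de31c1b367d59a3470329b2e1b09ab5eda4f4dafbaba03ed8a4095060a3",
}
for name, oid in expected.items():
    status = "OK" if sha256_of(name) == oid else "MISMATCH"
    print(name, status)
```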
quantizer.py CHANGED
```diff
@@ -1,3 +1,18 @@
+# coding=utf-8
+# Copyright 2023 WisdomShell Inc. All Rights Reserved.
+
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
 try:
     import bitsandbytes as bnb
     from bitsandbytes.nn.modules import Params4bit, Int8Params
```
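quantizer.py builds on bitsandbytes (Params4bit / Int8Params), which suggests quantized loading is supported. The sketch below uses the generic Transformers plus bitsandbytes route via BitsAndBytesConfig; whether CodeShell's custom quantizer.py is exercised on this path, and which compute dtype works best, are assumptions.

```python
# 4-bit loading via the standard Transformers + bitsandbytes route (assumed to apply here).
from transformers import AutoModelForCausalLM, BitsAndBytesConfig

bnb_config = BitsAndBytesConfig(load_in_4bit=True, bnb_4bit_compute_dtype="bfloat16")
model = AutoModelForCausalLM.from_pretrained(
    "WisdomShell/CodeShell-7B",
    trust_remote_code=True,
    quantization_config=bnb_config,
    device_map="auto",  # requires `accelerate` and a CUDA device for bitsandbytes
)
```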