v0.8.2

OlivierDehaene · OlivierDehaene · commit e7248fe90e27 · 2023-06-01T19:49:13.000+02:00
diff --git a/Cargo.lock b/Cargo.lock
diff --git a/Cargo.toml b/Cargo.toml
@@ -8,7 +8,7 @@ members = [
 ]
 
 [workspace.package]
-version = "0.8.1"
+version = "0.8.2"
 edition = "2021"
 authors = ["Olivier Dehaene"]
 homepage = "https://github.com/huggingface/text-generation-inference"
diff --git a/docs/openapi.json b/docs/openapi.json
@@ -10,7 +10,7 @@
       "name": "Apache 2.0",
       "url": "https://www.apache.org/licenses/LICENSE-2.0"
     },
-    "version": "0.8.1"
+    "version": "0.8.2"
   },
   "paths": {
     "/": {
diff --git a/server/pyproject.toml b/server/pyproject.toml
@@ -1,6 +1,6 @@
 [tool.poetry]
 name = "text-generation-server"
-version = "0.8.1"
+version = "0.8.2"
 description = "Text Generation Inference Python gRPC Server"
 authors = ["Olivier Dehaene <olivier@huggingface.co>"]
 
diff --git a/server/text_generation_server/models/__init__.py b/server/text_generation_server/models/__init__.py
@@ -138,7 +138,9 @@ def get_model(
                 trust_remote_code=trust_remote_code,
             )
 
-    config_dict, _ = PretrainedConfig.get_config_dict(model_id, revision=revision, trust_remote_code=trust_remote_code)
+    config_dict, _ = PretrainedConfig.get_config_dict(
+        model_id, revision=revision, trust_remote_code=trust_remote_code
+    )
     model_type = config_dict["model_type"]
 
     if model_type == "gpt_bigcode":
diff --git a/server/text_generation_server/models/flash_santacoder.py b/server/text_generation_server/models/flash_santacoder.py
@@ -87,7 +87,9 @@ def load_weights(
     ):
         for filename in filenames:
             with safe_open(
-                    filename, framework="pt", device=str(device) if quantize is None else "cpu"
+                filename,
+                framework="pt",
+                device=str(device) if quantize is None else "cpu",
             ) as f:
                 for key in f.keys():
                     value = f.get_tensor(key)
@@ -148,11 +150,13 @@ def load_weights(
                             module._parameters[param_name][: value.shape[0]] = value
                         elif "kv_attn.weight" in key:
                             module._parameters[param_name][
-                                model.transformer.head_size * model.transformer.num_heads :
+                                model.transformer.head_size
+                                * model.transformer.num_heads :
                             ] = value
                         elif "kv_attn.bias" in key:
                             module._parameters[param_name][
-                                model.transformer.head_size * model.transformer.num_heads :
+                                model.transformer.head_size
+                                * model.transformer.num_heads :
                             ] = value
                         else:
                             if current_parameter_tensor.shape != value.shape:

Original file line number	Diff line number	Diff line change
`@@ -8,7 +8,7 @@ members = [`
`8`	`8`	`]`
`9`	`9`
`10`	`10`	`[workspace.package]`
`11`		`-version = "0.8.1"`
	`11`	`+version = "0.8.2"`
`12`	`12`	`edition = "2021"`
`13`	`13`	`authors = ["Olivier Dehaene"]`
`14`	`14`	`homepage = "https://github.com/huggingface/text-generation-inference"`
Original file line number	Diff line number	Diff line change
`@@ -138,7 +138,9 @@ def get_model(`
`138`	`138`	`trust_remote_code=trust_remote_code,`
`139`	`139`	`)`
`140`	`140`
`141`		`- config_dict, _ = PretrainedConfig.get_config_dict(model_id, revision=revision, trust_remote_code=trust_remote_code)`
	`141`	`+ config_dict, _ = PretrainedConfig.get_config_dict(`
	`142`	`+ model_id, revision=revision, trust_remote_code=trust_remote_code`
	`143`	`+ )`
`142`	`144`	`model_type = config_dict["model_type"]`
`143`	`145`
`144`	`146`	`if model_type == "gpt_bigcode":`