Upload folder using huggingface_hub

Files changed (5) hide show

README.md CHANGED Viewed

@@ -146,7 +146,8 @@ print(processor.decode(out[0], skip_special_tokens=True))
 ##### In 8-bit precision (`int8`)
 >**Important:** Paper results only use int8 for the LLM weights while this loads all weights in int8.
-> We see that this gives slightly worse results but currently, int8 for some model parts is not supported by HuggingFace.
 <details>
 <summary> Click to expand </summary>

 ##### In 8-bit precision (`int8`)
 >**Important:** Paper results only use int8 for the LLM weights while this loads all weights in int8.
+> We see that this gives slightly worse results, but HuggingFace currently does not support using int8 for only some parts of the model.
 <details>
 <summary> Click to expand </summary>

config.json CHANGED Viewed

@@ -1,7 +1,7 @@
 {
-  "_commit_hash": "56fa1691779eaa22d603ca6ffa463f9adc05ac5f",
   "architectures": [
-    "Blip2ForConditionalGeneration"
   ],
   "initializer_factor": 1.0,
   "initializer_range": 0.02,
@@ -82,13 +82,13 @@
     "top_p": 1.0,
     "torch_dtype": null,
     "torchscript": false,
-    "transformers_version": "4.30.2",
     "typical_p": 1.0,
     "use_bfloat16": false,
     "vocab_size": 30522
   },
   "text_config": {
-    "_name_or_path": "",
     "add_cross_attention": false,
     "architectures": [
       "MT5ForConditionalGeneration"
@@ -164,7 +164,7 @@
     "top_p": 1.0,
     "torch_dtype": "float32",
     "torchscript": false,
-    "transformers_version": "4.30.2",
     "typical_p": 1.0,
     "use_bfloat16": false,
     "use_cache": true,
@@ -211,7 +211,7 @@
       "LABEL_0": 0,
       "LABEL_1": 1
     },
-    "layer_norm_eps": 1e-05,
     "length_penalty": 1.0,
     "max_length": 20,
     "min_length": 0,
@@ -249,7 +249,7 @@
     "top_p": 1.0,
     "torch_dtype": null,
     "torchscript": false,
-    "transformers_version": "4.30.2",
     "typical_p": 1.0,
     "use_bfloat16": false
   }

 {
+  "_commit_hash": "cc2bb7bce2f7d4d1c37753c7e9c05a443a226614",
   "architectures": [
+    "mBLIP"
   ],
   "initializer_factor": 1.0,
   "initializer_range": 0.02,
     "top_p": 1.0,
     "torch_dtype": null,
     "torchscript": false,
+    "transformers_version": "4.31.0",
     "typical_p": 1.0,
     "use_bfloat16": false,
     "vocab_size": 30522
   },
   "text_config": {
+    "_name_or_path": "/media/gregor/DATA/projects/wuerzburg/mblip/checkpoints/mt0-xl/07_24_2023_08_03_33-1-79282",
     "add_cross_attention": false,
     "architectures": [
       "MT5ForConditionalGeneration"
     "top_p": 1.0,
     "torch_dtype": "float32",
     "torchscript": false,
+    "transformers_version": "4.31.0",
     "typical_p": 1.0,
     "use_bfloat16": false,
     "use_cache": true,
       "LABEL_0": 0,
       "LABEL_1": 1
     },
+    "layer_norm_eps": 1e-06,
     "length_penalty": 1.0,
     "max_length": 20,
     "min_length": 0,
     "top_p": 1.0,
     "torch_dtype": null,
     "torchscript": false,
+    "transformers_version": "4.31.0",
     "typical_p": 1.0,
     "use_bfloat16": false
   }

pytorch_model-00001-of-00002.bin ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:eff61f2f4a6d9f018d6b114f3266bd528dee8c8d902d4d8bdfd709d1f6f934ff
+size 9960301947

pytorch_model-00002-of-00002.bin ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:d26f5efafa5b50329ad9212aa899f6a283404c0d07a8bffc0b0b94c42128b815
+size 9381409638

pytorch_model.bin.index.json CHANGED Viewed

The diff for this file is too large to render. See raw diff