fix_name_or_path (#13)
Browse files
- Remove _name_or_path and load tokenizer from the model directory (895e040d1520583604d996d2357e22c8b85b11f1)
Co-authored-by: Timur Khanipov <[email protected]>
- config.json +0 -2
- modeling_gigarembed.py +1 -1
config.json
CHANGED
|
@@ -15,7 +15,6 @@
|
|
| 15 |
"is_mask_instruction": true,
|
| 16 |
"latent_attention_config": {
|
| 17 |
"_attn_implementation_autoset": false,
|
| 18 |
-
"_name_or_path": "",
|
| 19 |
"add_cross_attention": false,
|
| 20 |
"architectures": null,
|
| 21 |
"bad_words_ids": null,
|
|
@@ -88,7 +87,6 @@
|
|
| 88 |
"padding_side": "right",
|
| 89 |
"text_config": {
|
| 90 |
"_attn_implementation_autoset": false,
|
| 91 |
-
"_name_or_path": "ai-sage/Giga-Embeddings-instruct",
|
| 92 |
"add_cross_attention": false,
|
| 93 |
"apply_qk_norm": true,
|
| 94 |
"architectures": null,
|
|
|
|
| 15 |
"is_mask_instruction": true,
|
| 16 |
"latent_attention_config": {
|
| 17 |
"_attn_implementation_autoset": false,
|
|
|
|
| 18 |
"add_cross_attention": false,
|
| 19 |
"architectures": null,
|
| 20 |
"bad_words_ids": null,
|
|
|
|
| 87 |
"padding_side": "right",
|
| 88 |
"text_config": {
|
| 89 |
"_attn_implementation_autoset": false,
|
|
|
|
| 90 |
"add_cross_attention": false,
|
| 91 |
"apply_qk_norm": true,
|
| 92 |
"architectures": null,
|
modeling_gigarembed.py
CHANGED
|
@@ -965,7 +965,7 @@ class GigarEmbedModel(PreTrainedModel):
|
|
| 965 |
|
| 966 |
# Initialize tokenizer if text config is available
|
| 967 |
self.tokenizer = AutoTokenizer.from_pretrained(
|
| 968 |
-
configuration.text_config._name_or_path
|
| 969 |
)
|
| 970 |
|
| 971 |
# Set configuration parameters
|
|
|
|
| 965 |
|
| 966 |
# Initialize tokenizer if text config is available
|
| 967 |
self.tokenizer = AutoTokenizer.from_pretrained(
|
| 968 |
+
configuration.name_or_path
|
| 969 |
)
|
| 970 |
|
| 971 |
# Set configuration parameters
|