dtamayo committed on
Commit
ab5dd0a
·
1 Parent(s): 7101272

update model

Browse files
README.md CHANGED
@@ -54,19 +54,19 @@ Training Hyperparameters
54
  >>> unmasker = pipeline('fill-mask', model='BSC-LT/MrBERT-science')
55
 
56
  >>> pprint(unmasker("Hubble's<mask>describes the expansion of the universe and the relationship between a galaxy's distance and its recessional velocity.", top_k=3))
57
- [{'score': 0.8203125,
58
  'sequence': "Hubble's law describes the expansion of the universe and the "
59
  "relationship between a galaxy's distance and its recessional "
60
  'velocity.',
61
  'token': 21673,
62
  'token_str': 'law'},
63
- {'score': 0.1259765625,
64
  'sequence': "Hubble's Law describes the expansion of the universe and the "
65
  "relationship between a galaxy's distance and its recessional "
66
  'velocity.',
67
  'token': 18573,
68
  'token_str': 'Law'},
69
- {'score': 0.0247802734375,
70
  'sequence': "Hubble's equation describes the expansion of the universe and "
71
  "the relationship between a galaxy's distance and its "
72
  'recessional velocity.',
 
54
  >>> unmasker = pipeline('fill-mask', model='BSC-LT/MrBERT-science')
55
 
56
  >>> pprint(unmasker("Hubble's<mask>describes the expansion of the universe and the relationship between a galaxy's distance and its recessional velocity.", top_k=3))
57
+ [{'score': 0.8211672902107239,
58
  'sequence': "Hubble's law describes the expansion of the universe and the "
59
  "relationship between a galaxy's distance and its recessional "
60
  'velocity.',
61
  'token': 21673,
62
  'token_str': 'law'},
63
+ {'score': 0.16654537618160248,
64
  'sequence': "Hubble's Law describes the expansion of the universe and the "
65
  "relationship between a galaxy's distance and its recessional "
66
  'velocity.',
67
  'token': 18573,
68
  'token_str': 'Law'},
69
+ {'score': 0.0063100955449044704,
70
  'sequence': "Hubble's equation describes the expansion of the universe and "
71
  "the relationship between a galaxy's distance and its "
72
  'recessional velocity.',
config.json CHANGED
@@ -12,6 +12,7 @@
12
  "cls_token_id": 1,
13
  "decoder_bias": true,
14
  "deterministic_flash_attn": false,
 
15
  "embedding_dropout": 0.0,
16
  "eos_token_id": 2,
17
  "global_attn_every_n_layers": 3,
@@ -35,9 +36,10 @@
35
  "num_hidden_layers": 22,
36
  "pad_token_id": 3,
37
  "position_embedding_type": "absolute",
 
38
  "sep_token_id": 2,
39
- "tie_word_embeddings": true,
40
- "torch_dtype": "bfloat16",
41
- "transformers_version": "4.48.0",
42
  "vocab_size": 256128
43
- }
 
12
  "cls_token_id": 1,
13
  "decoder_bias": true,
14
  "deterministic_flash_attn": false,
15
+ "dtype": "float32",
16
  "embedding_dropout": 0.0,
17
  "eos_token_id": 2,
18
  "global_attn_every_n_layers": 3,
 
36
  "num_hidden_layers": 22,
37
  "pad_token_id": 3,
38
  "position_embedding_type": "absolute",
39
+ "repad_logits_with_grad": false,
40
  "sep_token_id": 2,
41
+ "sparse_pred_ignore_index": -100,
42
+ "sparse_prediction": false,
43
+ "transformers_version": "4.56.2",
44
  "vocab_size": 256128
45
+ }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:481c17a5a9437d6079367583b7ad88683b6d85156bdeb4d19593ae833b8f6751
3
- size 1231552912
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c75df29298505934097bae2cee8afee8b66d68437928f2d2247ec4e0eb532e6c
3
+ size 1231552936
special_tokens_map.json CHANGED
@@ -1,4 +1,7 @@
1
  {
 
 
 
2
  "bos_token": {
3
  "content": "<s>",
4
  "lstrip": false,
@@ -15,7 +18,7 @@
15
  },
16
  "mask_token": {
17
  "content": "<mask>",
18
- "lstrip": true,
19
  "normalized": false,
20
  "rstrip": false,
21
  "single_word": false
@@ -34,4 +37,4 @@
34
  "rstrip": false,
35
  "single_word": false
36
  }
37
- }
 
1
  {
2
+ "additional_special_tokens": [
3
+ "<mask>"
4
+ ],
5
  "bos_token": {
6
  "content": "<s>",
7
  "lstrip": false,
 
18
  },
19
  "mask_token": {
20
  "content": "<mask>",
21
+ "lstrip": false,
22
  "normalized": false,
23
  "rstrip": false,
24
  "single_word": false
 
37
  "rstrip": false,
38
  "single_word": false
39
  }
40
+ }
tokenizer.json CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:031e825b2072f555233d0d01abc2cde072183173a53967e7e842813b9673748c
3
- size 19092952
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:641ca1224e2bfab63b3df7d6c3002384c358e1f28497741c6b943304d15ca9c2
3
+ size 37007965
tokenizer.model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5072e3209a04aa01dbf4db72b8fec52cf8cd06a042c9ba819678e084f7b665d5
3
- size 4813283
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8ddbda5816a0138ffd754cbbfafceba9628342cdd91df4bea6ee86f0fb44eae9
3
+ size 4813260
tokenizer_config.json CHANGED
@@ -4,7 +4,7 @@
4
  "add_prefix_space": true,
5
  "added_tokens_decoder": {
6
  "0": {
7
- "content": "<s>",
8
  "lstrip": false,
9
  "normalized": false,
10
  "rstrip": false,
@@ -12,7 +12,7 @@
12
  "special": true
13
  },
14
  "1": {
15
- "content": "<pad>",
16
  "lstrip": false,
17
  "normalized": false,
18
  "rstrip": false,
@@ -28,7 +28,7 @@
28
  "special": true
29
  },
30
  "3": {
31
- "content": "<unk>",
32
  "lstrip": false,
33
  "normalized": false,
34
  "rstrip": false,
@@ -52,8 +52,8 @@
52
  "special": true
53
  },
54
  "6": {
55
- "content": "<|reserved_token_1|>",
56
- "lstrip": true,
57
  "normalized": false,
58
  "rstrip": false,
59
  "single_word": false,
@@ -828,7 +828,7 @@
828
  "special": true
829
  },
830
  "103": {
831
- "content": "<mask>",
832
  "lstrip": false,
833
  "normalized": false,
834
  "rstrip": false,
@@ -844,7 +844,7 @@
844
  "special": false
845
  },
846
  "105": {
847
- "content": "\u2581\u2581",
848
  "lstrip": false,
849
  "normalized": false,
850
  "rstrip": false,
@@ -852,7 +852,7 @@
852
  "special": false
853
  },
854
  "106": {
855
- "content": "\u2581\u2581\u2581",
856
  "lstrip": false,
857
  "normalized": false,
858
  "rstrip": false,
@@ -860,7 +860,7 @@
860
  "special": false
861
  },
862
  "107": {
863
- "content": "\u2581\u2581\u2581\u2581",
864
  "lstrip": false,
865
  "normalized": false,
866
  "rstrip": false,
@@ -868,7 +868,7 @@
868
  "special": false
869
  },
870
  "108": {
871
- "content": "\u2581\u2581\u2581\u2581\u2581",
872
  "lstrip": false,
873
  "normalized": false,
874
  "rstrip": false,
@@ -876,7 +876,7 @@
876
  "special": false
877
  },
878
  "109": {
879
- "content": "\u2581\u2581\u2581\u2581\u2581\u2581",
880
  "lstrip": false,
881
  "normalized": false,
882
  "rstrip": false,
@@ -884,7 +884,7 @@
884
  "special": false
885
  },
886
  "110": {
887
- "content": "\u2581\u2581\u2581\u2581\u2581\u2581\u2581",
888
  "lstrip": false,
889
  "normalized": false,
890
  "rstrip": false,
@@ -892,7 +892,7 @@
892
  "special": false
893
  },
894
  "111": {
895
- "content": "\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581",
896
  "lstrip": false,
897
  "normalized": false,
898
  "rstrip": false,
@@ -900,7 +900,7 @@
900
  "special": false
901
  },
902
  "112": {
903
- "content": "\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581",
904
  "lstrip": false,
905
  "normalized": false,
906
  "rstrip": false,
@@ -908,7 +908,7 @@
908
  "special": false
909
  },
910
  "113": {
911
- "content": "\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581",
912
  "lstrip": false,
913
  "normalized": false,
914
  "rstrip": false,
@@ -916,7 +916,7 @@
916
  "special": false
917
  },
918
  "114": {
919
- "content": "\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581",
920
  "lstrip": false,
921
  "normalized": false,
922
  "rstrip": false,
@@ -924,7 +924,7 @@
924
  "special": false
925
  },
926
  "115": {
927
- "content": "\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581",
928
  "lstrip": false,
929
  "normalized": false,
930
  "rstrip": false,
@@ -932,7 +932,7 @@
932
  "special": false
933
  },
934
  "116": {
935
- "content": "\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581",
936
  "lstrip": false,
937
  "normalized": false,
938
  "rstrip": false,
@@ -940,7 +940,7 @@
940
  "special": false
941
  },
942
  "117": {
943
- "content": "\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581",
944
  "lstrip": false,
945
  "normalized": false,
946
  "rstrip": false,
@@ -948,7 +948,7 @@
948
  "special": false
949
  },
950
  "118": {
951
- "content": "\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581",
952
  "lstrip": false,
953
  "normalized": false,
954
  "rstrip": false,
@@ -956,7 +956,7 @@
956
  "special": false
957
  },
958
  "119": {
959
- "content": "\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581",
960
  "lstrip": false,
961
  "normalized": false,
962
  "rstrip": false,
@@ -964,7 +964,7 @@
964
  "special": false
965
  },
966
  "120": {
967
- "content": "\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581",
968
  "lstrip": false,
969
  "normalized": false,
970
  "rstrip": false,
@@ -972,7 +972,7 @@
972
  "special": false
973
  },
974
  "121": {
975
- "content": "\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581",
976
  "lstrip": false,
977
  "normalized": false,
978
  "rstrip": false,
@@ -980,7 +980,7 @@
980
  "special": false
981
  },
982
  "122": {
983
- "content": "\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581",
984
  "lstrip": false,
985
  "normalized": false,
986
  "rstrip": false,
@@ -988,7 +988,7 @@
988
  "special": false
989
  },
990
  "123": {
991
- "content": "\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581",
992
  "lstrip": false,
993
  "normalized": false,
994
  "rstrip": false,
@@ -996,7 +996,7 @@
996
  "special": false
997
  },
998
  "124": {
999
- "content": "\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581",
1000
  "lstrip": false,
1001
  "normalized": false,
1002
  "rstrip": false,
@@ -1004,7 +1004,7 @@
1004
  "special": false
1005
  },
1006
  "125": {
1007
- "content": "\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581",
1008
  "lstrip": false,
1009
  "normalized": false,
1010
  "rstrip": false,
@@ -1012,7 +1012,7 @@
1012
  "special": false
1013
  },
1014
  "126": {
1015
- "content": "\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581",
1016
  "lstrip": false,
1017
  "normalized": false,
1018
  "rstrip": false,
@@ -1020,7 +1020,7 @@
1020
  "special": false
1021
  },
1022
  "127": {
1023
- "content": "\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581\u2581",
1024
  "lstrip": false,
1025
  "normalized": false,
1026
  "rstrip": false,
@@ -1084,9 +1084,13 @@
1084
  "special": false
1085
  }
1086
  },
 
 
 
1087
  "bos_token": "<s>",
1088
  "clean_up_tokenization_spaces": false,
1089
  "eos_token": "</s>",
 
1090
  "legacy": true,
1091
  "mask_token": "<mask>",
1092
  "model_max_length": 8192,
@@ -1095,9 +1099,5 @@
1095
  "spaces_between_special_tokens": false,
1096
  "tokenizer_class": "LlamaTokenizer",
1097
  "unk_token": "<unk>",
1098
- "use_default_system_prompt": false,
1099
- "model_input_names": [
1100
- "input_ids",
1101
- "attention_mask"
1102
- ]
1103
- }
 
4
  "add_prefix_space": true,
5
  "added_tokens_decoder": {
6
  "0": {
7
+ "content": "<unk>",
8
  "lstrip": false,
9
  "normalized": false,
10
  "rstrip": false,
 
12
  "special": true
13
  },
14
  "1": {
15
+ "content": "<s>",
16
  "lstrip": false,
17
  "normalized": false,
18
  "rstrip": false,
 
28
  "special": true
29
  },
30
  "3": {
31
+ "content": "<pad>",
32
  "lstrip": false,
33
  "normalized": false,
34
  "rstrip": false,
 
52
  "special": true
53
  },
54
  "6": {
55
+ "content": "<mask>",
56
+ "lstrip": false,
57
  "normalized": false,
58
  "rstrip": false,
59
  "single_word": false,
 
828
  "special": true
829
  },
830
  "103": {
831
+ "content": "<|reserved_token_98|>",
832
  "lstrip": false,
833
  "normalized": false,
834
  "rstrip": false,
 
844
  "special": false
845
  },
846
  "105": {
847
+ "content": "▁▁",
848
  "lstrip": false,
849
  "normalized": false,
850
  "rstrip": false,
 
852
  "special": false
853
  },
854
  "106": {
855
+ "content": "▁▁▁",
856
  "lstrip": false,
857
  "normalized": false,
858
  "rstrip": false,
 
860
  "special": false
861
  },
862
  "107": {
863
+ "content": "▁▁▁▁",
864
  "lstrip": false,
865
  "normalized": false,
866
  "rstrip": false,
 
868
  "special": false
869
  },
870
  "108": {
871
+ "content": "▁▁▁▁▁",
872
  "lstrip": false,
873
  "normalized": false,
874
  "rstrip": false,
 
876
  "special": false
877
  },
878
  "109": {
879
+ "content": "▁▁▁▁▁▁",
880
  "lstrip": false,
881
  "normalized": false,
882
  "rstrip": false,
 
884
  "special": false
885
  },
886
  "110": {
887
+ "content": "▁▁▁▁▁▁▁",
888
  "lstrip": false,
889
  "normalized": false,
890
  "rstrip": false,
 
892
  "special": false
893
  },
894
  "111": {
895
+ "content": "▁▁▁▁▁▁▁▁",
896
  "lstrip": false,
897
  "normalized": false,
898
  "rstrip": false,
 
900
  "special": false
901
  },
902
  "112": {
903
+ "content": "▁▁▁▁▁▁▁▁▁",
904
  "lstrip": false,
905
  "normalized": false,
906
  "rstrip": false,
 
908
  "special": false
909
  },
910
  "113": {
911
+ "content": "▁▁▁▁▁▁▁▁▁▁",
912
  "lstrip": false,
913
  "normalized": false,
914
  "rstrip": false,
 
916
  "special": false
917
  },
918
  "114": {
919
+ "content": "▁▁▁▁▁▁▁▁▁▁▁",
920
  "lstrip": false,
921
  "normalized": false,
922
  "rstrip": false,
 
924
  "special": false
925
  },
926
  "115": {
927
+ "content": "▁▁▁▁▁▁▁▁▁▁▁▁",
928
  "lstrip": false,
929
  "normalized": false,
930
  "rstrip": false,
 
932
  "special": false
933
  },
934
  "116": {
935
+ "content": "▁▁▁▁▁▁▁▁▁▁▁▁▁",
936
  "lstrip": false,
937
  "normalized": false,
938
  "rstrip": false,
 
940
  "special": false
941
  },
942
  "117": {
943
+ "content": "▁▁▁▁▁▁▁▁▁▁▁▁▁▁",
944
  "lstrip": false,
945
  "normalized": false,
946
  "rstrip": false,
 
948
  "special": false
949
  },
950
  "118": {
951
+ "content": "▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁",
952
  "lstrip": false,
953
  "normalized": false,
954
  "rstrip": false,
 
956
  "special": false
957
  },
958
  "119": {
959
+ "content": "▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁",
960
  "lstrip": false,
961
  "normalized": false,
962
  "rstrip": false,
 
964
  "special": false
965
  },
966
  "120": {
967
+ "content": "▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁",
968
  "lstrip": false,
969
  "normalized": false,
970
  "rstrip": false,
 
972
  "special": false
973
  },
974
  "121": {
975
+ "content": "▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁",
976
  "lstrip": false,
977
  "normalized": false,
978
  "rstrip": false,
 
980
  "special": false
981
  },
982
  "122": {
983
+ "content": "▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁",
984
  "lstrip": false,
985
  "normalized": false,
986
  "rstrip": false,
 
988
  "special": false
989
  },
990
  "123": {
991
+ "content": "▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁",
992
  "lstrip": false,
993
  "normalized": false,
994
  "rstrip": false,
 
996
  "special": false
997
  },
998
  "124": {
999
+ "content": "▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁",
1000
  "lstrip": false,
1001
  "normalized": false,
1002
  "rstrip": false,
 
1004
  "special": false
1005
  },
1006
  "125": {
1007
+ "content": "▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁",
1008
  "lstrip": false,
1009
  "normalized": false,
1010
  "rstrip": false,
 
1012
  "special": false
1013
  },
1014
  "126": {
1015
+ "content": "▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁",
1016
  "lstrip": false,
1017
  "normalized": false,
1018
  "rstrip": false,
 
1020
  "special": false
1021
  },
1022
  "127": {
1023
+ "content": "▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁▁",
1024
  "lstrip": false,
1025
  "normalized": false,
1026
  "rstrip": false,
 
1084
  "special": false
1085
  }
1086
  },
1087
+ "additional_special_tokens": [
1088
+ "<mask>"
1089
+ ],
1090
  "bos_token": "<s>",
1091
  "clean_up_tokenization_spaces": false,
1092
  "eos_token": "</s>",
1093
+ "extra_special_tokens": {},
1094
  "legacy": true,
1095
  "mask_token": "<mask>",
1096
  "model_max_length": 8192,
 
1099
  "spaces_between_special_tokens": false,
1100
  "tokenizer_class": "LlamaTokenizer",
1101
  "unk_token": "<unk>",
1102
+ "use_default_system_prompt": false
1103
+ }