yahyaabd commited on
Commit
504f3cf
·
verified ·
1 Parent(s): 647e4c9

Upload folder using huggingface_hub

Browse files
README.md CHANGED
@@ -110,11 +110,11 @@ You can finetune this model on your own dataset.
110
 
111
  ### Framework Versions
112
  - Python: 3.11.12
113
- - Sentence Transformers: 3.4.1
114
  - Transformers: 4.51.3
115
  - PyTorch: 2.6.0+cu124
116
  - Accelerate: 1.6.0
117
- - Datasets:
118
  - Tokenizers: 0.21.1
119
 
120
  ## Citation
 
110
 
111
  ### Framework Versions
112
  - Python: 3.11.12
113
+ - Sentence Transformers: 4.1.0
114
  - Transformers: 4.51.3
115
  - PyTorch: 2.6.0+cu124
116
  - Accelerate: 1.6.0
117
+ - Datasets: 2.14.4
118
  - Tokenizers: 0.21.1
119
 
120
  ## Citation
added_tokens.json CHANGED
@@ -1,21 +1,32 @@
1
  {
 
 
2
  "BPP": 30551,
3
  "BPS": 30521,
4
  "BRS": 30566,
5
  "Badan Pusat Statistik": 30522,
6
  "CIF": 30556,
 
 
7
  "EKSPOR": 30573,
8
  "Ekspor": 30552,
9
  "FOB": 30555,
 
 
 
 
10
  "HLS": 30543,
11
  "HS": 30554,
 
12
  "IHK": 30525,
13
  "IHP": 30527,
14
  "IHPB": 30528,
15
  "IMK": 30532,
16
  "IMPOR": 30574,
 
17
  "IPH": 30526,
18
  "IPM": 30537,
 
19
  "ITB": 30531,
20
  "ITK": 30530,
21
  "Impor": 30553,
@@ -27,37 +38,57 @@
27
  "KKL": 30560,
28
  "KRT": 30563,
29
  "Katalog": 30571,
 
 
30
  "LPE": 30533,
31
  "LTN": 30549,
32
  "LTT": 30548,
 
 
 
 
33
  "Metadata": 30570,
34
  "NTP": 30529,
35
  "NTUP": 30550,
36
  "PDB": 30524,
37
  "PDRB": 30523,
38
  "PKL": 30559,
 
39
  "PUBLIKASI": 30576,
 
40
  "Publikasi": 30567,
41
  "RLS": 30544,
42
  "RT": 30564,
43
  "RW": 30565,
44
  "SAKERNAS": 30575,
45
  "SDGI": 30541,
 
46
  "SDKI": 30540,
 
47
  "SEKTORAL": 30579,
 
 
 
 
48
  "SP2020": 30538,
 
49
  "ST2013": 30547,
50
  "ST2023": 30546,
51
  "STATISTIK": 30578,
52
  "SUPAS": 30539,
53
  "SURVEI": 30581,
 
54
  "SUTAS": 30545,
55
  "Sakernas": 30557,
56
  "Sektoral": 30569,
 
57
  "Survei": 30572,
 
58
  "TPAK": 30558,
59
  "TPK": 30534,
60
  "TPT": 30535,
 
 
61
  "UMP": 30536,
62
  "_Statistik": 30568,
63
  "bpp": 30604,
@@ -65,7 +96,10 @@
65
  "cif": 30606,
66
  "fob": 30605,
67
  "hls": 30596,
 
68
  "ihk": 30583,
 
 
69
  "imk": 30587,
70
  "iph": 30584,
71
  "ipm": 30591,
@@ -81,15 +115,20 @@
81
  "ntp": 30585,
82
  "ntup": 30603,
83
  "pdrb": 30582,
 
84
  "rls": 30597,
85
  "sakernas": 30607,
86
  "sdgi": 30595,
87
  "sdki": 30594,
88
  "sektoral": 30614,
 
 
 
89
  "sp2020": 30592,
90
  "st2013": 30600,
91
  "st2023": 30599,
92
  "supas": 30593,
 
93
  "sutas": 30598,
94
  "tpak": 30608,
95
  "tpk": 30589,
 
1
  {
2
+ "ASFR": 30654,
3
+ "BOP": 30648,
4
  "BPP": 30551,
5
  "BPS": 30521,
6
  "BRS": 30566,
7
  "Badan Pusat Statistik": 30522,
8
  "CIF": 30556,
9
+ "CMR": 30649,
10
+ "CPI": 30639,
11
  "EKSPOR": 30573,
12
  "Ekspor": 30552,
13
  "FOB": 30555,
14
+ "GDP": 30637,
15
+ "GK": 30626,
16
+ "GRDP": 30638,
17
+ "HDI": 30641,
18
  "HLS": 30543,
19
  "HS": 30554,
20
+ "IBS": 30624,
21
  "IHK": 30525,
22
  "IHP": 30527,
23
  "IHPB": 30528,
24
  "IMK": 30532,
25
  "IMPOR": 30574,
26
+ "IMR": 30650,
27
  "IPH": 30526,
28
  "IPM": 30537,
29
+ "IPP": 30640,
30
  "ITB": 30531,
31
  "ITK": 30530,
32
  "Impor": 30553,
 
38
  "KKL": 30560,
39
  "KRT": 30563,
40
  "Katalog": 30571,
41
+ "LFPR": 30644,
42
+ "LFS": 30647,
43
  "LPE": 30533,
44
  "LTN": 30549,
45
  "LTT": 30548,
46
+ "MDGs": 30645,
47
+ "METADATA": 30627,
48
+ "MMR": 30652,
49
+ "MYS": 30643,
50
  "Metadata": 30570,
51
  "NTP": 30529,
52
  "NTUP": 30550,
53
  "PDB": 30524,
54
  "PDRB": 30523,
55
  "PKL": 30559,
56
+ "PODES": 30628,
57
  "PUBLIKASI": 30576,
58
+ "Podes": 30623,
59
  "Publikasi": 30567,
60
  "RLS": 30544,
61
  "RT": 30564,
62
  "RW": 30565,
63
  "SAKERNAS": 30575,
64
  "SDGI": 30541,
65
+ "SDGs": 30646,
66
  "SDKI": 30540,
67
+ "SE": 30621,
68
  "SEKTORAL": 30579,
69
+ "SHK": 30619,
70
+ "SKHI": 30625,
71
+ "SP": 30620,
72
+ "SP2010": 30616,
73
  "SP2020": 30538,
74
+ "ST": 30622,
75
  "ST2013": 30547,
76
  "ST2023": 30546,
77
  "STATISTIK": 30578,
78
  "SUPAS": 30539,
79
  "SURVEI": 30581,
80
+ "SUSENAS": 30618,
81
  "SUTAS": 30545,
82
  "Sakernas": 30557,
83
  "Sektoral": 30569,
84
+ "Statistik": 30617,
85
  "Survei": 30572,
86
+ "TFR": 30653,
87
  "TPAK": 30558,
88
  "TPK": 30534,
89
  "TPT": 30535,
90
+ "U5MR": 30651,
91
+ "UHC": 30642,
92
  "UMP": 30536,
93
  "_Statistik": 30568,
94
  "bpp": 30604,
 
96
  "cif": 30606,
97
  "fob": 30605,
98
  "hls": 30596,
99
+ "ibs": 30635,
100
  "ihk": 30583,
101
+ "ihp": 30629,
102
+ "ihpb": 30630,
103
  "imk": 30587,
104
  "iph": 30584,
105
  "ipm": 30591,
 
115
  "ntp": 30585,
116
  "ntup": 30603,
117
  "pdrb": 30582,
118
+ "podes": 30634,
119
  "rls": 30597,
120
  "sakernas": 30607,
121
  "sdgi": 30595,
122
  "sdki": 30594,
123
  "sektoral": 30614,
124
+ "shk": 30633,
125
+ "skhi": 30636,
126
+ "sp2010": 30631,
127
  "sp2020": 30592,
128
  "st2013": 30600,
129
  "st2023": 30599,
130
  "supas": 30593,
131
+ "susenas": 30632,
132
  "sutas": 30598,
133
  "tpak": 30608,
134
  "tpk": 30589,
config.json CHANGED
@@ -42,5 +42,5 @@
42
  "transformers_version": "4.51.3",
43
  "type_vocab_size": 2,
44
  "use_cache": true,
45
- "vocab_size": 30616
46
  }
 
42
  "transformers_version": "4.51.3",
43
  "type_vocab_size": 2,
44
  "use_cache": true,
45
+ "vocab_size": 30655
46
  }
config_sentence_transformers.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
  "__version__": {
3
- "sentence_transformers": "3.4.1",
4
  "transformers": "4.51.3",
5
  "pytorch": "2.6.0+cu124"
6
  },
 
1
  {
2
  "__version__": {
3
+ "sentence_transformers": "4.1.0",
4
  "transformers": "4.51.3",
5
  "pytorch": "2.6.0+cu124"
6
  },
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:54c6e7bf16068c5948125e9b4f15700979f4bea31f2154d0a2041f950686427d
3
- size 438240096
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1ee2a7f419365e4f5aed12a0740460c5a4aa84365ced586546df0923664677ee
3
+ size 438359904
tokenizer.json CHANGED
@@ -902,6 +902,357 @@
902
  "rstrip": false,
903
  "normalized": true,
904
  "special": false
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
905
  }
906
  ],
907
  "normalizer": {
 
902
  "rstrip": false,
903
  "normalized": true,
904
  "special": false
905
+ },
906
+ {
907
+ "id": 30616,
908
+ "content": "SP2010",
909
+ "single_word": false,
910
+ "lstrip": false,
911
+ "rstrip": false,
912
+ "normalized": true,
913
+ "special": false
914
+ },
915
+ {
916
+ "id": 30617,
917
+ "content": "Statistik",
918
+ "single_word": false,
919
+ "lstrip": false,
920
+ "rstrip": false,
921
+ "normalized": true,
922
+ "special": false
923
+ },
924
+ {
925
+ "id": 30618,
926
+ "content": "SUSENAS",
927
+ "single_word": false,
928
+ "lstrip": false,
929
+ "rstrip": false,
930
+ "normalized": true,
931
+ "special": false
932
+ },
933
+ {
934
+ "id": 30619,
935
+ "content": "SHK",
936
+ "single_word": false,
937
+ "lstrip": false,
938
+ "rstrip": false,
939
+ "normalized": true,
940
+ "special": false
941
+ },
942
+ {
943
+ "id": 30620,
944
+ "content": "SP",
945
+ "single_word": false,
946
+ "lstrip": false,
947
+ "rstrip": false,
948
+ "normalized": true,
949
+ "special": false
950
+ },
951
+ {
952
+ "id": 30621,
953
+ "content": "SE",
954
+ "single_word": false,
955
+ "lstrip": false,
956
+ "rstrip": false,
957
+ "normalized": true,
958
+ "special": false
959
+ },
960
+ {
961
+ "id": 30622,
962
+ "content": "ST",
963
+ "single_word": false,
964
+ "lstrip": false,
965
+ "rstrip": false,
966
+ "normalized": true,
967
+ "special": false
968
+ },
969
+ {
970
+ "id": 30623,
971
+ "content": "Podes",
972
+ "single_word": false,
973
+ "lstrip": false,
974
+ "rstrip": false,
975
+ "normalized": true,
976
+ "special": false
977
+ },
978
+ {
979
+ "id": 30624,
980
+ "content": "IBS",
981
+ "single_word": false,
982
+ "lstrip": false,
983
+ "rstrip": false,
984
+ "normalized": true,
985
+ "special": false
986
+ },
987
+ {
988
+ "id": 30625,
989
+ "content": "SKHI",
990
+ "single_word": false,
991
+ "lstrip": false,
992
+ "rstrip": false,
993
+ "normalized": true,
994
+ "special": false
995
+ },
996
+ {
997
+ "id": 30626,
998
+ "content": "GK",
999
+ "single_word": false,
1000
+ "lstrip": false,
1001
+ "rstrip": false,
1002
+ "normalized": true,
1003
+ "special": false
1004
+ },
1005
+ {
1006
+ "id": 30627,
1007
+ "content": "METADATA",
1008
+ "single_word": false,
1009
+ "lstrip": false,
1010
+ "rstrip": false,
1011
+ "normalized": true,
1012
+ "special": false
1013
+ },
1014
+ {
1015
+ "id": 30628,
1016
+ "content": "PODES",
1017
+ "single_word": false,
1018
+ "lstrip": false,
1019
+ "rstrip": false,
1020
+ "normalized": true,
1021
+ "special": false
1022
+ },
1023
+ {
1024
+ "id": 30629,
1025
+ "content": "ihp",
1026
+ "single_word": false,
1027
+ "lstrip": false,
1028
+ "rstrip": false,
1029
+ "normalized": true,
1030
+ "special": false
1031
+ },
1032
+ {
1033
+ "id": 30630,
1034
+ "content": "ihpb",
1035
+ "single_word": false,
1036
+ "lstrip": false,
1037
+ "rstrip": false,
1038
+ "normalized": true,
1039
+ "special": false
1040
+ },
1041
+ {
1042
+ "id": 30631,
1043
+ "content": "sp2010",
1044
+ "single_word": false,
1045
+ "lstrip": false,
1046
+ "rstrip": false,
1047
+ "normalized": true,
1048
+ "special": false
1049
+ },
1050
+ {
1051
+ "id": 30632,
1052
+ "content": "susenas",
1053
+ "single_word": false,
1054
+ "lstrip": false,
1055
+ "rstrip": false,
1056
+ "normalized": true,
1057
+ "special": false
1058
+ },
1059
+ {
1060
+ "id": 30633,
1061
+ "content": "shk",
1062
+ "single_word": false,
1063
+ "lstrip": false,
1064
+ "rstrip": false,
1065
+ "normalized": true,
1066
+ "special": false
1067
+ },
1068
+ {
1069
+ "id": 30634,
1070
+ "content": "podes",
1071
+ "single_word": false,
1072
+ "lstrip": false,
1073
+ "rstrip": false,
1074
+ "normalized": true,
1075
+ "special": false
1076
+ },
1077
+ {
1078
+ "id": 30635,
1079
+ "content": "ibs",
1080
+ "single_word": false,
1081
+ "lstrip": false,
1082
+ "rstrip": false,
1083
+ "normalized": true,
1084
+ "special": false
1085
+ },
1086
+ {
1087
+ "id": 30636,
1088
+ "content": "skhi",
1089
+ "single_word": false,
1090
+ "lstrip": false,
1091
+ "rstrip": false,
1092
+ "normalized": true,
1093
+ "special": false
1094
+ },
1095
+ {
1096
+ "id": 30637,
1097
+ "content": "GDP",
1098
+ "single_word": false,
1099
+ "lstrip": false,
1100
+ "rstrip": false,
1101
+ "normalized": true,
1102
+ "special": false
1103
+ },
1104
+ {
1105
+ "id": 30638,
1106
+ "content": "GRDP",
1107
+ "single_word": false,
1108
+ "lstrip": false,
1109
+ "rstrip": false,
1110
+ "normalized": true,
1111
+ "special": false
1112
+ },
1113
+ {
1114
+ "id": 30639,
1115
+ "content": "CPI",
1116
+ "single_word": false,
1117
+ "lstrip": false,
1118
+ "rstrip": false,
1119
+ "normalized": true,
1120
+ "special": false
1121
+ },
1122
+ {
1123
+ "id": 30640,
1124
+ "content": "IPP",
1125
+ "single_word": false,
1126
+ "lstrip": false,
1127
+ "rstrip": false,
1128
+ "normalized": true,
1129
+ "special": false
1130
+ },
1131
+ {
1132
+ "id": 30641,
1133
+ "content": "HDI",
1134
+ "single_word": false,
1135
+ "lstrip": false,
1136
+ "rstrip": false,
1137
+ "normalized": true,
1138
+ "special": false
1139
+ },
1140
+ {
1141
+ "id": 30642,
1142
+ "content": "UHC",
1143
+ "single_word": false,
1144
+ "lstrip": false,
1145
+ "rstrip": false,
1146
+ "normalized": true,
1147
+ "special": false
1148
+ },
1149
+ {
1150
+ "id": 30643,
1151
+ "content": "MYS",
1152
+ "single_word": false,
1153
+ "lstrip": false,
1154
+ "rstrip": false,
1155
+ "normalized": true,
1156
+ "special": false
1157
+ },
1158
+ {
1159
+ "id": 30644,
1160
+ "content": "LFPR",
1161
+ "single_word": false,
1162
+ "lstrip": false,
1163
+ "rstrip": false,
1164
+ "normalized": true,
1165
+ "special": false
1166
+ },
1167
+ {
1168
+ "id": 30645,
1169
+ "content": "MDGs",
1170
+ "single_word": false,
1171
+ "lstrip": false,
1172
+ "rstrip": false,
1173
+ "normalized": true,
1174
+ "special": false
1175
+ },
1176
+ {
1177
+ "id": 30646,
1178
+ "content": "SDGs",
1179
+ "single_word": false,
1180
+ "lstrip": false,
1181
+ "rstrip": false,
1182
+ "normalized": true,
1183
+ "special": false
1184
+ },
1185
+ {
1186
+ "id": 30647,
1187
+ "content": "LFS",
1188
+ "single_word": false,
1189
+ "lstrip": false,
1190
+ "rstrip": false,
1191
+ "normalized": true,
1192
+ "special": false
1193
+ },
1194
+ {
1195
+ "id": 30648,
1196
+ "content": "BOP",
1197
+ "single_word": false,
1198
+ "lstrip": false,
1199
+ "rstrip": false,
1200
+ "normalized": true,
1201
+ "special": false
1202
+ },
1203
+ {
1204
+ "id": 30649,
1205
+ "content": "CMR",
1206
+ "single_word": false,
1207
+ "lstrip": false,
1208
+ "rstrip": false,
1209
+ "normalized": true,
1210
+ "special": false
1211
+ },
1212
+ {
1213
+ "id": 30650,
1214
+ "content": "IMR",
1215
+ "single_word": false,
1216
+ "lstrip": false,
1217
+ "rstrip": false,
1218
+ "normalized": true,
1219
+ "special": false
1220
+ },
1221
+ {
1222
+ "id": 30651,
1223
+ "content": "U5MR",
1224
+ "single_word": false,
1225
+ "lstrip": false,
1226
+ "rstrip": false,
1227
+ "normalized": true,
1228
+ "special": false
1229
+ },
1230
+ {
1231
+ "id": 30652,
1232
+ "content": "MMR",
1233
+ "single_word": false,
1234
+ "lstrip": false,
1235
+ "rstrip": false,
1236
+ "normalized": true,
1237
+ "special": false
1238
+ },
1239
+ {
1240
+ "id": 30653,
1241
+ "content": "TFR",
1242
+ "single_word": false,
1243
+ "lstrip": false,
1244
+ "rstrip": false,
1245
+ "normalized": true,
1246
+ "special": false
1247
+ },
1248
+ {
1249
+ "id": 30654,
1250
+ "content": "ASFR",
1251
+ "single_word": false,
1252
+ "lstrip": false,
1253
+ "rstrip": false,
1254
+ "normalized": true,
1255
+ "special": false
1256
  }
1257
  ],
1258
  "normalizer": {
tokenizer_config.json CHANGED
@@ -799,6 +799,318 @@
799
  "rstrip": false,
800
  "single_word": false,
801
  "special": false
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
802
  }
803
  },
804
  "clean_up_tokenization_spaces": true,
 
799
  "rstrip": false,
800
  "single_word": false,
801
  "special": false
802
+ },
803
+ "30616": {
804
+ "content": "SP2010",
805
+ "lstrip": false,
806
+ "normalized": true,
807
+ "rstrip": false,
808
+ "single_word": false,
809
+ "special": false
810
+ },
811
+ "30617": {
812
+ "content": "Statistik",
813
+ "lstrip": false,
814
+ "normalized": true,
815
+ "rstrip": false,
816
+ "single_word": false,
817
+ "special": false
818
+ },
819
+ "30618": {
820
+ "content": "SUSENAS",
821
+ "lstrip": false,
822
+ "normalized": true,
823
+ "rstrip": false,
824
+ "single_word": false,
825
+ "special": false
826
+ },
827
+ "30619": {
828
+ "content": "SHK",
829
+ "lstrip": false,
830
+ "normalized": true,
831
+ "rstrip": false,
832
+ "single_word": false,
833
+ "special": false
834
+ },
835
+ "30620": {
836
+ "content": "SP",
837
+ "lstrip": false,
838
+ "normalized": true,
839
+ "rstrip": false,
840
+ "single_word": false,
841
+ "special": false
842
+ },
843
+ "30621": {
844
+ "content": "SE",
845
+ "lstrip": false,
846
+ "normalized": true,
847
+ "rstrip": false,
848
+ "single_word": false,
849
+ "special": false
850
+ },
851
+ "30622": {
852
+ "content": "ST",
853
+ "lstrip": false,
854
+ "normalized": true,
855
+ "rstrip": false,
856
+ "single_word": false,
857
+ "special": false
858
+ },
859
+ "30623": {
860
+ "content": "Podes",
861
+ "lstrip": false,
862
+ "normalized": true,
863
+ "rstrip": false,
864
+ "single_word": false,
865
+ "special": false
866
+ },
867
+ "30624": {
868
+ "content": "IBS",
869
+ "lstrip": false,
870
+ "normalized": true,
871
+ "rstrip": false,
872
+ "single_word": false,
873
+ "special": false
874
+ },
875
+ "30625": {
876
+ "content": "SKHI",
877
+ "lstrip": false,
878
+ "normalized": true,
879
+ "rstrip": false,
880
+ "single_word": false,
881
+ "special": false
882
+ },
883
+ "30626": {
884
+ "content": "GK",
885
+ "lstrip": false,
886
+ "normalized": true,
887
+ "rstrip": false,
888
+ "single_word": false,
889
+ "special": false
890
+ },
891
+ "30627": {
892
+ "content": "METADATA",
893
+ "lstrip": false,
894
+ "normalized": true,
895
+ "rstrip": false,
896
+ "single_word": false,
897
+ "special": false
898
+ },
899
+ "30628": {
900
+ "content": "PODES",
901
+ "lstrip": false,
902
+ "normalized": true,
903
+ "rstrip": false,
904
+ "single_word": false,
905
+ "special": false
906
+ },
907
+ "30629": {
908
+ "content": "ihp",
909
+ "lstrip": false,
910
+ "normalized": true,
911
+ "rstrip": false,
912
+ "single_word": false,
913
+ "special": false
914
+ },
915
+ "30630": {
916
+ "content": "ihpb",
917
+ "lstrip": false,
918
+ "normalized": true,
919
+ "rstrip": false,
920
+ "single_word": false,
921
+ "special": false
922
+ },
923
+ "30631": {
924
+ "content": "sp2010",
925
+ "lstrip": false,
926
+ "normalized": true,
927
+ "rstrip": false,
928
+ "single_word": false,
929
+ "special": false
930
+ },
931
+ "30632": {
932
+ "content": "susenas",
933
+ "lstrip": false,
934
+ "normalized": true,
935
+ "rstrip": false,
936
+ "single_word": false,
937
+ "special": false
938
+ },
939
+ "30633": {
940
+ "content": "shk",
941
+ "lstrip": false,
942
+ "normalized": true,
943
+ "rstrip": false,
944
+ "single_word": false,
945
+ "special": false
946
+ },
947
+ "30634": {
948
+ "content": "podes",
949
+ "lstrip": false,
950
+ "normalized": true,
951
+ "rstrip": false,
952
+ "single_word": false,
953
+ "special": false
954
+ },
955
+ "30635": {
956
+ "content": "ibs",
957
+ "lstrip": false,
958
+ "normalized": true,
959
+ "rstrip": false,
960
+ "single_word": false,
961
+ "special": false
962
+ },
963
+ "30636": {
964
+ "content": "skhi",
965
+ "lstrip": false,
966
+ "normalized": true,
967
+ "rstrip": false,
968
+ "single_word": false,
969
+ "special": false
970
+ },
971
+ "30637": {
972
+ "content": "GDP",
973
+ "lstrip": false,
974
+ "normalized": true,
975
+ "rstrip": false,
976
+ "single_word": false,
977
+ "special": false
978
+ },
979
+ "30638": {
980
+ "content": "GRDP",
981
+ "lstrip": false,
982
+ "normalized": true,
983
+ "rstrip": false,
984
+ "single_word": false,
985
+ "special": false
986
+ },
987
+ "30639": {
988
+ "content": "CPI",
989
+ "lstrip": false,
990
+ "normalized": true,
991
+ "rstrip": false,
992
+ "single_word": false,
993
+ "special": false
994
+ },
995
+ "30640": {
996
+ "content": "IPP",
997
+ "lstrip": false,
998
+ "normalized": true,
999
+ "rstrip": false,
1000
+ "single_word": false,
1001
+ "special": false
1002
+ },
1003
+ "30641": {
1004
+ "content": "HDI",
1005
+ "lstrip": false,
1006
+ "normalized": true,
1007
+ "rstrip": false,
1008
+ "single_word": false,
1009
+ "special": false
1010
+ },
1011
+ "30642": {
1012
+ "content": "UHC",
1013
+ "lstrip": false,
1014
+ "normalized": true,
1015
+ "rstrip": false,
1016
+ "single_word": false,
1017
+ "special": false
1018
+ },
1019
+ "30643": {
1020
+ "content": "MYS",
1021
+ "lstrip": false,
1022
+ "normalized": true,
1023
+ "rstrip": false,
1024
+ "single_word": false,
1025
+ "special": false
1026
+ },
1027
+ "30644": {
1028
+ "content": "LFPR",
1029
+ "lstrip": false,
1030
+ "normalized": true,
1031
+ "rstrip": false,
1032
+ "single_word": false,
1033
+ "special": false
1034
+ },
1035
+ "30645": {
1036
+ "content": "MDGs",
1037
+ "lstrip": false,
1038
+ "normalized": true,
1039
+ "rstrip": false,
1040
+ "single_word": false,
1041
+ "special": false
1042
+ },
1043
+ "30646": {
1044
+ "content": "SDGs",
1045
+ "lstrip": false,
1046
+ "normalized": true,
1047
+ "rstrip": false,
1048
+ "single_word": false,
1049
+ "special": false
1050
+ },
1051
+ "30647": {
1052
+ "content": "LFS",
1053
+ "lstrip": false,
1054
+ "normalized": true,
1055
+ "rstrip": false,
1056
+ "single_word": false,
1057
+ "special": false
1058
+ },
1059
+ "30648": {
1060
+ "content": "BOP",
1061
+ "lstrip": false,
1062
+ "normalized": true,
1063
+ "rstrip": false,
1064
+ "single_word": false,
1065
+ "special": false
1066
+ },
1067
+ "30649": {
1068
+ "content": "CMR",
1069
+ "lstrip": false,
1070
+ "normalized": true,
1071
+ "rstrip": false,
1072
+ "single_word": false,
1073
+ "special": false
1074
+ },
1075
+ "30650": {
1076
+ "content": "IMR",
1077
+ "lstrip": false,
1078
+ "normalized": true,
1079
+ "rstrip": false,
1080
+ "single_word": false,
1081
+ "special": false
1082
+ },
1083
+ "30651": {
1084
+ "content": "U5MR",
1085
+ "lstrip": false,
1086
+ "normalized": true,
1087
+ "rstrip": false,
1088
+ "single_word": false,
1089
+ "special": false
1090
+ },
1091
+ "30652": {
1092
+ "content": "MMR",
1093
+ "lstrip": false,
1094
+ "normalized": true,
1095
+ "rstrip": false,
1096
+ "single_word": false,
1097
+ "special": false
1098
+ },
1099
+ "30653": {
1100
+ "content": "TFR",
1101
+ "lstrip": false,
1102
+ "normalized": true,
1103
+ "rstrip": false,
1104
+ "single_word": false,
1105
+ "special": false
1106
+ },
1107
+ "30654": {
1108
+ "content": "ASFR",
1109
+ "lstrip": false,
1110
+ "normalized": true,
1111
+ "rstrip": false,
1112
+ "single_word": false,
1113
+ "special": false
1114
  }
1115
  },
1116
  "clean_up_tokenization_spaces": true,