serenarolloh
committed on
Commit
•
aabe3cc
1
Parent(s):
d4b35da
Training done
Browse files
- added_tokens.json +6 -0
- tokenizer.json +54 -0
- tokenizer_config.json +48 -0
added_tokens.json
CHANGED
@@ -8,8 +8,10 @@
|
|
8 |
"</s_customer_no>": 57595,
|
9 |
"</s_customer_phone_no>": 57570,
|
10 |
"</s_customer_pin>": 57556,
|
|
|
11 |
"</s_customer_reference_no>": 57609,
|
12 |
"</s_cutomer_no>": 57599,
|
|
|
13 |
"</s_date>": 57530,
|
14 |
"</s_delivery_contact>": 57568,
|
15 |
"</s_delivery_contact_person>": 57619,
|
@@ -18,6 +20,7 @@
|
|
18 |
"</s_document_no>": 57593,
|
19 |
"</s_document_type>": 57528,
|
20 |
"</s_dropoff point>": 57590,
|
|
|
21 |
"</s_dropoff_point>": 57548,
|
22 |
"</s_header>": 57526,
|
23 |
"</s_invoice_no>": 57576,
|
@@ -58,8 +61,10 @@
|
|
58 |
"<s_customer_no>": 57594,
|
59 |
"<s_customer_phone_no>": 57569,
|
60 |
"<s_customer_pin>": 57555,
|
|
|
61 |
"<s_customer_reference_no>": 57608,
|
62 |
"<s_cutomer_no>": 57598,
|
|
|
63 |
"<s_date>": 57529,
|
64 |
"<s_delivery_contact>": 57567,
|
65 |
"<s_delivery_contact_person>": 57618,
|
@@ -68,6 +73,7 @@
|
|
68 |
"<s_document_no>": 57592,
|
69 |
"<s_document_type>": 57527,
|
70 |
"<s_dropoff point>": 57589,
|
|
|
71 |
"<s_dropoff_point>": 57547,
|
72 |
"<s_header>": 57525,
|
73 |
"<s_iitcdip>": 57523,
|
|
|
8 |
"</s_customer_no>": 57595,
|
9 |
"</s_customer_phone_no>": 57570,
|
10 |
"</s_customer_pin>": 57556,
|
11 |
+
"</s_customer_reference>": 57629,
|
12 |
"</s_customer_reference_no>": 57609,
|
13 |
"</s_cutomer_no>": 57599,
|
14 |
+
"</s_cutomer_pin>": 57627,
|
15 |
"</s_date>": 57530,
|
16 |
"</s_delivery_contact>": 57568,
|
17 |
"</s_delivery_contact_person>": 57619,
|
|
|
20 |
"</s_document_no>": 57593,
|
21 |
"</s_document_type>": 57528,
|
22 |
"</s_dropoff point>": 57590,
|
23 |
+
"</s_dropoff>": 57625,
|
24 |
"</s_dropoff_point>": 57548,
|
25 |
"</s_header>": 57526,
|
26 |
"</s_invoice_no>": 57576,
|
|
|
61 |
"<s_customer_no>": 57594,
|
62 |
"<s_customer_phone_no>": 57569,
|
63 |
"<s_customer_pin>": 57555,
|
64 |
+
"<s_customer_reference>": 57628,
|
65 |
"<s_customer_reference_no>": 57608,
|
66 |
"<s_cutomer_no>": 57598,
|
67 |
+
"<s_cutomer_pin>": 57626,
|
68 |
"<s_date>": 57529,
|
69 |
"<s_delivery_contact>": 57567,
|
70 |
"<s_delivery_contact_person>": 57618,
|
|
|
73 |
"<s_document_no>": 57592,
|
74 |
"<s_document_type>": 57527,
|
75 |
"<s_dropoff point>": 57589,
|
76 |
+
"<s_dropoff>": 57624,
|
77 |
"<s_dropoff_point>": 57547,
|
78 |
"<s_header>": 57525,
|
79 |
"<s_iitcdip>": 57523,
|
tokenizer.json
CHANGED
@@ -979,6 +979,60 @@
|
|
979 |
"rstrip": false,
|
980 |
"normalized": true,
|
981 |
"special": false
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
982 |
}
|
983 |
],
|
984 |
"normalizer": {
|
|
|
979 |
"rstrip": false,
|
980 |
"normalized": true,
|
981 |
"special": false
|
982 |
+
},
|
983 |
+
{
|
984 |
+
"id": 57624,
|
985 |
+
"content": "<s_dropoff>",
|
986 |
+
"single_word": false,
|
987 |
+
"lstrip": false,
|
988 |
+
"rstrip": false,
|
989 |
+
"normalized": true,
|
990 |
+
"special": false
|
991 |
+
},
|
992 |
+
{
|
993 |
+
"id": 57625,
|
994 |
+
"content": "</s_dropoff>",
|
995 |
+
"single_word": false,
|
996 |
+
"lstrip": false,
|
997 |
+
"rstrip": false,
|
998 |
+
"normalized": true,
|
999 |
+
"special": false
|
1000 |
+
},
|
1001 |
+
{
|
1002 |
+
"id": 57626,
|
1003 |
+
"content": "<s_cutomer_pin>",
|
1004 |
+
"single_word": false,
|
1005 |
+
"lstrip": false,
|
1006 |
+
"rstrip": false,
|
1007 |
+
"normalized": true,
|
1008 |
+
"special": false
|
1009 |
+
},
|
1010 |
+
{
|
1011 |
+
"id": 57627,
|
1012 |
+
"content": "</s_cutomer_pin>",
|
1013 |
+
"single_word": false,
|
1014 |
+
"lstrip": false,
|
1015 |
+
"rstrip": false,
|
1016 |
+
"normalized": true,
|
1017 |
+
"special": false
|
1018 |
+
},
|
1019 |
+
{
|
1020 |
+
"id": 57628,
|
1021 |
+
"content": "<s_customer_reference>",
|
1022 |
+
"single_word": false,
|
1023 |
+
"lstrip": false,
|
1024 |
+
"rstrip": false,
|
1025 |
+
"normalized": true,
|
1026 |
+
"special": false
|
1027 |
+
},
|
1028 |
+
{
|
1029 |
+
"id": 57629,
|
1030 |
+
"content": "</s_customer_reference>",
|
1031 |
+
"single_word": false,
|
1032 |
+
"lstrip": false,
|
1033 |
+
"rstrip": false,
|
1034 |
+
"normalized": true,
|
1035 |
+
"special": false
|
1036 |
}
|
1037 |
],
|
1038 |
"normalizer": {
|
tokenizer_config.json
CHANGED
@@ -855,6 +855,54 @@
|
|
855 |
"rstrip": false,
|
856 |
"single_word": false,
|
857 |
"special": false
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
858 |
}
|
859 |
},
|
860 |
"additional_special_tokens": [
|
|
|
855 |
"rstrip": false,
|
856 |
"single_word": false,
|
857 |
"special": false
|
858 |
+
},
|
859 |
+
"57624": {
|
860 |
+
"content": "<s_dropoff>",
|
861 |
+
"lstrip": false,
|
862 |
+
"normalized": true,
|
863 |
+
"rstrip": false,
|
864 |
+
"single_word": false,
|
865 |
+
"special": false
|
866 |
+
},
|
867 |
+
"57625": {
|
868 |
+
"content": "</s_dropoff>",
|
869 |
+
"lstrip": false,
|
870 |
+
"normalized": true,
|
871 |
+
"rstrip": false,
|
872 |
+
"single_word": false,
|
873 |
+
"special": false
|
874 |
+
},
|
875 |
+
"57626": {
|
876 |
+
"content": "<s_cutomer_pin>",
|
877 |
+
"lstrip": false,
|
878 |
+
"normalized": true,
|
879 |
+
"rstrip": false,
|
880 |
+
"single_word": false,
|
881 |
+
"special": false
|
882 |
+
},
|
883 |
+
"57627": {
|
884 |
+
"content": "</s_cutomer_pin>",
|
885 |
+
"lstrip": false,
|
886 |
+
"normalized": true,
|
887 |
+
"rstrip": false,
|
888 |
+
"single_word": false,
|
889 |
+
"special": false
|
890 |
+
},
|
891 |
+
"57628": {
|
892 |
+
"content": "<s_customer_reference>",
|
893 |
+
"lstrip": false,
|
894 |
+
"normalized": true,
|
895 |
+
"rstrip": false,
|
896 |
+
"single_word": false,
|
897 |
+
"special": false
|
898 |
+
},
|
899 |
+
"57629": {
|
900 |
+
"content": "</s_customer_reference>",
|
901 |
+
"lstrip": false,
|
902 |
+
"normalized": true,
|
903 |
+
"rstrip": false,
|
904 |
+
"single_word": false,
|
905 |
+
"special": false
|
906 |
}
|
907 |
},
|
908 |
"additional_special_tokens": [
|