chore: fix $ and €
Browse files
anonymize_file_clear.py
CHANGED
@@ -23,7 +23,8 @@ def load_models():
|
|
23 |
|
24 |
|
25 |
def anonymize_with_cml(text, embeddings_model, tokenizer, cml_ner_model):
|
26 |
-
token_pattern = r"(\b[\w\.\/\-@]+\b|[\s,.!?;:'\"-]+)"
|
|
|
27 |
tokens = re.findall(token_pattern, text)
|
28 |
uuid_map = {}
|
29 |
processed_tokens = []
|
|
|
23 |
|
24 |
|
25 |
def anonymize_with_cml(text, embeddings_model, tokenizer, cml_ner_model):
|
26 |
+
token_pattern = r"(\b[\w\.\/\-@]+\b|[\s,.!?;:'\"-]+|\$\d+(?:\.\d+)?|\€\d+(?:\.\d+)?)"
|
27 |
+
|
28 |
tokens = re.findall(token_pattern, text)
|
29 |
uuid_map = {}
|
30 |
processed_tokens = []
|
files/anonymized_document.txt
CHANGED
@@ -1,11 +1 @@
|
|
1 |
-
|
2 |
-
|
3 |
-
Date: c0239016 4f1ec317, e1bfa3a5
|
4 |
-
|
5 |
-
Scope: 7166a872 agrees to provide graphic design services to 7f2310e8 for the creation of a company logo.
|
6 |
-
|
7 |
-
Amount: 7f2310e8 agrees to pay 7166a872 500 upon completion and delivery of the logo.
|
8 |
-
|
9 |
-
Deadline: The logo design must be completed and delivered to 7f2310e8 within 14 days of the contract signing date.
|
10 |
-
|
11 |
-
Payment terms: 7166a872's international bank account N: df667faf
|
|
|
1 |
+
14 days and 2c68f2f2
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
files/mapping_clear_to_anonymized.pkl
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f05e1dd38586c17aed4200febefb058205bd510f9b4b7eba5724fbf05ad78d5d
|
3 |
+
size 77
|
files/mapping_doc_embedding_path.pkl
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4b119b5428b6f0740ea7201428cc34ebdf9b893c99613afa40e58dc46586a3ed
|
3 |
+
size 16674
|
files/original_document.txt
CHANGED
@@ -4,8 +4,8 @@ Date: February 06, 2000
|
|
4 |
|
5 |
Scope: Kate agrees to provide graphic design services to David for the creation of a company logo.
|
6 |
|
7 |
-
Amount: David agrees to pay Kate $500 upon completion and delivery of the logo.
|
8 |
|
9 |
-
Deadline: The logo design must be completed and delivered to David within 14 days of the contract signing date.
|
10 |
|
11 |
Payment terms: Kate's international bank account N°: IL150120690000003111111
|
|
|
4 |
|
5 |
Scope: Kate agrees to provide graphic design services to David for the creation of a company logo.
|
6 |
|
7 |
+
Amount: David agrees to pay Kate $1500 upon completion and delivery of the logo.
|
8 |
|
9 |
+
Deadline: The logo design must be completed and delivered to David within 14-days of the contract signing date.
|
10 |
|
11 |
Payment terms: Kate's international bank account N°: IL150120690000003111111
|
files/original_document_uuid_mapping.json
CHANGED
@@ -1,8 +1,3 @@
|
|
1 |
{
|
2 |
-
"06": "4f1ec317",
|
3 |
-
"2000": "e1bfa3a5",
|
4 |
-
"David": "7f2310e8",
|
5 |
-
"February": "c0239016",
|
6 |
-
"IL150120690000003111111": "df667faf",
|
7 |
-
"Kate": "7166a872"
|
8 |
}
|
|
|
1 |
{
|
2 |
+
"$500": "2c68f2f2"
|
|
|
|
|
|
|
|
|
|
|
3 |
}
|