Hiveurban committed on
Commit
390d738
·
verified ·
1 Parent(s): a774a0e

Upload handler.py with huggingface_hub

Browse files
Files changed (2) hide show
  1. .gitattributes +1 -0
  2. handler.py +3 -40
.gitattributes CHANGED
@@ -34,3 +34,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
  vocab.txt filter=lfs diff=lfs merge=lfs -text
 
 
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
  vocab.txt filter=lfs diff=lfs merge=lfs -text
37
+ handler.py filter=lfs diff=lfs merge=lfs -text
handler.py CHANGED
@@ -1,40 +1,3 @@
1
- from typing import Dict, List, Any
2
- from transformers import AutoModel, AutoTokenizer
3
-
4
-
5
- class EndpointHandler:
6
- def __init__(self, path="."):
7
- self.tokenizer = AutoTokenizer.from_pretrained(path)
8
- self.model = AutoModel.from_pretrained(
9
- path,
10
- trust_remote_code=True,
11
- do_syntax=True, do_prefix=False, do_morph=False, do_ner=True, do_lex=True
12
- )
13
- self.model.eval()
14
-
15
- def __call__(self, data: Dict[str, Any]) -> List[Dict[str, Any]]:
16
- """
17
- data args:
18
- inputs (:obj: `str` | `PIL.Image` | `np.array`)
19
- kwargs
20
- Return:
21
- A :obj:`list` | `dict`: will be serialized and returned
22
- """
23
- # return self.pipeline(data['inputs'])
24
- outputs = self.model.predict(data['inputs'], self.tokenizer, output_style='json')
25
- for i, output in enumerate(outputs):
26
- lem = ' '.join([x['lex'] for x in output['tokens']])
27
- ner = [
28
- {
29
- 'word': ' '.join([x['lex'] for x in output['tokens'][x['token_start']:x['token_end'] + 1]]),
30
- 'entity_group': x['label'],
31
- 'token_start': x['token_start'],
32
- 'token_end': x['token_end']
33
- }
34
- for x in output['ner_entities']
35
- ]
36
- outputs[i] = {
37
- 'lex': lem,
38
- 'ner': ner
39
- }
40
- return outputs
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:26ce128baa792901b22cecfdd6a7dc783307e60d4b766dcd3aa4d1eaeb3a36d2
3
+ size 744148153