anz2 committed on
Commit
bf694f7
1 Parent(s): 354cd04

update docs and rename variables.

Browse files
Files changed (1) hide show
  1. iliauniiccocrevaluation.py +15 -19
iliauniiccocrevaluation.py CHANGED
@@ -42,17 +42,17 @@ Args:
42
  predictions: list of OCR detections in FiftyOne dataset format.
43
  references: list of OCR detections in FiftyOne dataset format.
44
  Returns:
45
- evaluation_results: dictionary containing multiple metrics
46
  Examples:
47
  Examples should be written in doctest format, and should illustrate how
48
  to use the function.
49
 
50
  >>> dataset = load_dataset("anz2/iliauni_icc_georgian_ocr", use_auth_token="<auth token here>")
51
  >>> sample = dataset['test'][0]
52
- >>> ocr_evaluator = evaluate.load("iliauniiccocrevaluation")
53
- >>> results = ocr_evaluator.compute(references=[sample], predictions=[0, 1])
54
- >>> print(results)
55
- {'accuracy': 1.0}
56
  """
57
 
58
 
@@ -117,9 +117,7 @@ class IliauniIccOCREvaluation(evaluate.Metric):
117
  ),
118
  "image": datasets.Image()
119
  }
120
- ),
121
- length=-1,
122
- id=None
123
  ),
124
  "references": datasets.Sequence(
125
  feature=datasets.Features(
@@ -167,17 +165,15 @@ class IliauniIccOCREvaluation(evaluate.Metric):
167
  ),
168
  "image": datasets.Image()
169
  }
170
- ),
171
- length=-1,
172
- id=None
173
- ),
174
  }
175
  ),
176
  # Homepage of the module for documentation
177
- homepage="http://module.homepage",
178
  # Additional links to the codebase or references
179
- codebase_urls=["http://github.com/path/to/codebase/of/new_module"],
180
- reference_urls=["http://path.to.reference.url/new_module"]
181
  )
182
 
183
  def _download_and_prepare(self, dl_manager):
@@ -189,12 +185,12 @@ class IliauniIccOCREvaluation(evaluate.Metric):
189
  """Returns the scores"""
190
 
191
  assert len(predictions) == len(references)
192
- eval_results = []
193
  for prediction, reference in zip(predictions, references):
194
  prediction_df = FiftyOneOcr(data=prediction).get_word_annotations(convert_bbox=True)
195
  reference_df = FiftyOneOcr(data=reference).get_word_annotations(convert_bbox=True)
196
 
197
- eval_result = evaluate_by_words(prediction_df, reference_df, pref1="Pred_", pref2="Tar_")
198
- eval_results.append(eval_result)
199
 
200
- return eval_results
 
42
  predictions: list of OCR detections in FiftyOne dataset format.
43
  references: list of OCR detections in FiftyOne dataset format.
44
  Returns:
45
+ evaluation_results: list of dictionaries containing multiple metrics
46
  Examples:
47
  Examples should be written in doctest format, and should illustrate how
48
  to use the function.
49
 
50
  >>> dataset = load_dataset("anz2/iliauni_icc_georgian_ocr", use_auth_token="<auth token here>")
51
  >>> sample = dataset['test'][0]
52
+ >>> ocr_evaluator = evaluate.load("anz2/iliauniiccocrevaluation")
53
+ >>> results = ocr_evaluator._compute(predictions=[sample], references=[sample])
54
+ >>> print(results[0].keys())
55
+ dict_keys(['accuracy', 'precision', 'recall', 'f1', 'levenstein_distances_stats', 'levenstein_similarities_stats', 'iou_stats', 'edit_operations_stats'])
56
  """
57
 
58
 
 
117
  ),
118
  "image": datasets.Image()
119
  }
120
+ )
 
 
121
  ),
122
  "references": datasets.Sequence(
123
  feature=datasets.Features(
 
165
  ),
166
  "image": datasets.Image()
167
  }
168
+ )
169
+ )
 
 
170
  }
171
  ),
172
  # Homepage of the module for documentation
173
+ homepage="",
174
  # Additional links to the codebase or references
175
+ codebase_urls=["https://github.com/IliaUni-ICC/ocr_evaluation"],
176
+ reference_urls=[]
177
  )
178
 
179
  def _download_and_prepare(self, dl_manager):
 
185
  """Returns the scores"""
186
 
187
  assert len(predictions) == len(references)
188
+ results = []
189
  for prediction, reference in zip(predictions, references):
190
  prediction_df = FiftyOneOcr(data=prediction).get_word_annotations(convert_bbox=True)
191
  reference_df = FiftyOneOcr(data=reference).get_word_annotations(convert_bbox=True)
192
 
193
+ result = evaluate_by_words(prediction_df, reference_df, pref1="Pred_", pref2="Tar_")
194
+ results.append(result)
195
 
196
+ return results