Spaces:
Runtime error
Runtime error
update docs and rename variables.
Browse files - iliauniiccocrevaluation.py +15 -19
iliauniiccocrevaluation.py
CHANGED
@@ -42,17 +42,17 @@ Args:
|
|
42 |
predictions: list of OCR detections in FiftyOne dataset format.
|
43 |
references: list of OCR detections in FiftyOne dataset format.
|
44 |
Returns:
|
45 |
-
evaluation_results:
|
46 |
Examples:
|
47 |
Examples should be written in doctest format, and should illustrate how
|
48 |
to use the function.
|
49 |
|
50 |
>>> dataset = load_dataset("anz2/iliauni_icc_georgian_ocr", use_auth_token="<auth token here>")
|
51 |
>>> sample = dataset['test'][0]
|
52 |
-
>>> ocr_evaluator = evaluate.load("iliauniiccocrevaluation")
|
53 |
-
>>> results = ocr_evaluator.
|
54 |
-
>>> print(results)
|
55 |
-
|
56 |
"""
|
57 |
|
58 |
|
@@ -117,9 +117,7 @@ class IliauniIccOCREvaluation(evaluate.Metric):
|
|
117 |
),
|
118 |
"image": datasets.Image()
|
119 |
}
|
120 |
-
)
|
121 |
-
length=-1,
|
122 |
-
id=None
|
123 |
),
|
124 |
"references": datasets.Sequence(
|
125 |
feature=datasets.Features(
|
@@ -167,17 +165,15 @@ class IliauniIccOCREvaluation(evaluate.Metric):
|
|
167 |
),
|
168 |
"image": datasets.Image()
|
169 |
}
|
170 |
-
)
|
171 |
-
|
172 |
-
id=None
|
173 |
-
),
|
174 |
}
|
175 |
),
|
176 |
# Homepage of the module for documentation
|
177 |
-
homepage="
|
178 |
# Additional links to the codebase or references
|
179 |
-
codebase_urls=["
|
180 |
-
reference_urls=[
|
181 |
)
|
182 |
|
183 |
def _download_and_prepare(self, dl_manager):
|
@@ -189,12 +185,12 @@ class IliauniIccOCREvaluation(evaluate.Metric):
|
|
189 |
"""Returns the scores"""
|
190 |
|
191 |
assert len(predictions) == len(references)
|
192 |
-
|
193 |
for prediction, reference in zip(predictions, references):
|
194 |
prediction_df = FiftyOneOcr(data=prediction).get_word_annotations(convert_bbox=True)
|
195 |
reference_df = FiftyOneOcr(data=reference).get_word_annotations(convert_bbox=True)
|
196 |
|
197 |
-
|
198 |
-
|
199 |
|
200 |
-
return
|
|
|
42 |
predictions: list of OCR detections in FiftyOne dataset format.
|
43 |
references: list of OCR detections in FiftyOne dataset format.
|
44 |
Returns:
|
45 |
+
evaluation_results: list of dictionaries containing multiple metrics
|
46 |
Examples:
|
47 |
Examples should be written in doctest format, and should illustrate how
|
48 |
to use the function.
|
49 |
|
50 |
>>> dataset = load_dataset("anz2/iliauni_icc_georgian_ocr", use_auth_token="<auth token here>")
|
51 |
>>> sample = dataset['test'][0]
|
52 |
+
>>> ocr_evaluator = evaluate.load("anz2/iliauniiccocrevaluation")
|
53 |
+
>>> results = ocr_evaluator._compute(predictions=[sample], references=[sample])
|
54 |
+
>>> print(results[0].keys())
|
55 |
+
dict_keys(['accuracy', 'precision', 'recall', 'f1', 'levenstein_distances_stats', 'levenstein_similarities_stats', 'iou_stats', 'edit_operations_stats'])
|
56 |
"""
|
57 |
|
58 |
|
|
|
117 |
),
|
118 |
"image": datasets.Image()
|
119 |
}
|
120 |
+
)
|
|
|
|
|
121 |
),
|
122 |
"references": datasets.Sequence(
|
123 |
feature=datasets.Features(
|
|
|
165 |
),
|
166 |
"image": datasets.Image()
|
167 |
}
|
168 |
+
)
|
169 |
+
)
|
|
|
|
|
170 |
}
|
171 |
),
|
172 |
# Homepage of the module for documentation
|
173 |
+
homepage="",
|
174 |
# Additional links to the codebase or references
|
175 |
+
codebase_urls=["https://github.com/IliaUni-ICC/ocr_evaluation"],
|
176 |
+
reference_urls=[]
|
177 |
)
|
178 |
|
179 |
def _download_and_prepare(self, dl_manager):
|
|
|
185 |
"""Returns the scores"""
|
186 |
|
187 |
assert len(predictions) == len(references)
|
188 |
+
results = []
|
189 |
for prediction, reference in zip(predictions, references):
|
190 |
prediction_df = FiftyOneOcr(data=prediction).get_word_annotations(convert_bbox=True)
|
191 |
reference_df = FiftyOneOcr(data=reference).get_word_annotations(convert_bbox=True)
|
192 |
|
193 |
+
result = evaluate_by_words(prediction_df, reference_df, pref1="Pred_", pref2="Tar_")
|
194 |
+
results.append(result)
|
195 |
|
196 |
+
return results
|