diff --git a/gazpy/gazetteer/geodict.py b/gazpy/gazetteer/geodict.py index 9b9061c94e0be2d08edbcbe7093307992b719032..aac2c4d3168775c564dc36b2411899bea9d4aec4 100644 --- a/gazpy/gazetteer/geodict.py +++ b/gazpy/gazetteer/geodict.py @@ -2,7 +2,8 @@ from .base import Base, parse_label2, return_on_failure - +import jellyfish +from ..helpers import is_date class Geodict(Base): """""" @@ -35,7 +36,12 @@ class Geodict(Base): sorted_by=self.score_field, sized=True, size=n) res = self.to_element(self.es_client.search("gazetteer", "place", query)) - return res + + res_filtered = [] + for el in res: + if not jellyfish.jaro_winkler(el.label.lang,label) < 0.5: + res_filtered.append(el) + return res_filtered except Exception as e: return [] @@ -51,7 +57,13 @@ class Geodict(Base): regexp_value=".* ({0}) .*".format(alias), field="aliases", value=alias, sorted=score, sorted_by=self.score_field, sized=True, size=n) - return res + res_filtered = [] + for el in res: + for al in el.alialiases.lang: + if not jellyfish.jaro_winkler(al, alias) < 0.5: + res_filtered.append(el) + break + return res_filtered except : return [] diff --git a/gazpy/helpers.py b/gazpy/helpers.py index d3f692bfd059a052b7dd782089358cd5e06ec74a..d0c943dc7cdcc0469454ab69516558ed276e7a5a 100644 --- a/gazpy/helpers.py +++ b/gazpy/helpers.py @@ -1,3 +1,3 @@ # coding = utf-8 -import numpy as np \ No newline at end of file +import numpy as np