Skip to content

Commit

Permalink
Merge pull request #127 from gyorilab/safer-prefix-index
Browse files (browse the repository at this point in the history)
Improve safety of NER build
  • Loading branch information
bgyori authored Feb 6, 2024
2 parents: e4be647 + 7b72202; commit 24cfa02
Show file tree
Hide file tree
Showing 2 changed files with 6 additions and 0 deletions.
4 changes: 4 additions & 0 deletions gilda/grounder.py
Original file line number Diff line number Diff line change
Expand Up @@ -111,7 +111,11 @@ def __init__(
def _build_prefix_index(self):
    """Build ``self.prefix_index`` from the keys of ``self.entries``.

    For every normalized term key in ``self.entries``, the first
    whitespace-delimited token is mapped to the set of token counts of
    all terms that start with that token. The result is stored on
    ``self.prefix_index`` as a plain ``dict`` (not a ``defaultdict``),
    so looking up an unknown first token does not create a new entry.

    Keys that are falsy (e.g. the empty string) or that consist only of
    whitespace are skipped, since they have no first token to index.
    """
    prefix_index = defaultdict(set)
    for norm_term in self.entries:
        # Guard against empty/falsy keys before calling ``split``.
        if not norm_term:
            continue
        parts = norm_term.split()
        # A whitespace-only key splits into an empty list; ``parts[0]``
        # would raise IndexError, so skip it.
        if not parts:
            continue
        prefix_index[parts[0]].add(len(parts))
    # Freeze into a regular dict so later lookups cannot silently add keys.
    self.prefix_index = dict(prefix_index)

Expand Down
2 changes: 2 additions & 0 deletions gilda/term.py
Original file line number Diff line number Diff line change
Expand Up @@ -52,6 +52,8 @@ def __init__(self, norm_text, text, db, id, entry_name, status, source,
organism=None, source_db=None, source_id=None):
if not text:
raise ValueError('Text for Term cannot be empty')
if not norm_text.strip():
raise ValueError('Normalized text for Term cannot be empty')
self.norm_text = norm_text
self.text = text
self.db = db
Expand Down

0 comments on commit 24cfa02

Please sign in to comment.