Skip to content

Commit

Permalink
Merge pull request #3 from graphext/extension_check
Browse files (browse the repository at this point in the history)
Allow forced registration of extension by default
  • Loading branch information
ines authored Apr 9, 2019
2 parents c588f1f + cc9031f commit 381d20a
Show file tree
Hide file tree
Showing 2 changed files with 9 additions and 7 deletions.
1 change: 1 addition & 0 deletions .gitignore
Original file line number Diff line number Diff line change
@@ -1,5 +1,6 @@
# Byte-compiled / optimized / DLL files
__pycache__/
+.pytest_cache/
*.py[cod]
*$py.class

Expand Down
15 changes: 8 additions & 7 deletions spacymoji/__init__.py
Original file line number Diff line number Diff line change
Expand Up @@ -37,7 +37,8 @@ class Emoji(object):
name = 'emoji'

def __init__(self, nlp, merge_spans=True, lookup={}, pattern_id='EMOJI',
-attrs=('has_emoji', 'is_emoji', 'emoji_desc', 'emoji')):
+attrs=('has_emoji', 'is_emoji', 'emoji_desc', 'emoji'),
+force_extension=True):
"""Initialise the pipeline component.
nlp (Language): The shared nlp object. Used to initialise the matcher
Expand All @@ -59,12 +60,12 @@ def __init__(self, nlp, merge_spans=True, lookup={}, pattern_id='EMOJI',
emoji_patterns = list(nlp.tokenizer.pipe(EMOJI.keys()))
self.matcher.add(pattern_id, None, *emoji_patterns)
# Add attributes
-Doc.set_extension(self._has_emoji, getter=self.has_emoji)
-Doc.set_extension(self._emoji, getter=self.iter_emoji)
-Span.set_extension(self._has_emoji, getter=self.has_emoji)
-Span.set_extension(self._emoji, getter=self.iter_emoji)
-Token.set_extension(self._is_emoji, default=False)
-Token.set_extension(self._emoji_desc, getter=self.get_emoji_desc)
+Doc.set_extension(self._has_emoji, getter=self.has_emoji, force=force_extension)
+Doc.set_extension(self._emoji, getter=self.iter_emoji, force=force_extension)
+Span.set_extension(self._has_emoji, getter=self.has_emoji, force=force_extension)
+Span.set_extension(self._emoji, getter=self.iter_emoji, force=force_extension)
+Token.set_extension(self._is_emoji, default=False, force=force_extension)
+Token.set_extension(self._emoji_desc, getter=self.get_emoji_desc, force=force_extension)

def __call__(self, doc):
"""Apply the pipeline component to a `Doc` object.
Expand Down

0 comments on commit 381d20a

Please sign in to comment.