import spacy
from spacymoji import Emoji
def test():
    """Tokenise three sample strings and print every resulting token.

    Loads the ``en_core_web_sm`` model, puts an ``Emoji`` component
    (created with ``merge_spans=True``) at the front of the pipeline, then
    runs each sample through it and prints the tokens one per line.

    Returns:
        The ``Doc`` produced for the last sample string.
    """
    pipeline = spacy.load('en_core_web_sm')
    # NOTE(review): passing a component *instance* to add_pipe looks like the
    # spaCy 2.x calling convention -- confirm against the installed version.
    emoji_component = Emoji(pipeline, merge_spans=True)
    pipeline.add_pipe(emoji_component, first=True)

    samples = (
        'Word!👍🏿',   # emoji with modifier, no space after "!"
        'Word! 👍🏿',  # same emoji, separated from "!" by a space
        'Word!👍',    # plain emoji, no space after "!"
    )
    for text in samples:
        doc = pipeline(text)
        for token in doc:
            print(token)

    # As in the original, only the Doc for the final sample is handed back.
    return doc
The code above demonstrates the problem: "Word!" is not correctly split into "Word" and "!" when the thumbs-up emoji has a dark skin tone modifier.