我希望输出为 ["good customer service", "great ambience"],
但实际得到的是 ["good customer", "good customer service", "great ambience"],
因为该模式也匹配了 "good customer",而这个短语单独出现没有意义。如何删除这类重叠的匹配项?
import spacy
from spacy.matcher import Matcher
# Extract adjective + noun phrases from a sentence, keeping only the longest
# span whenever several matches overlap.
nlp = spacy.load("en_core_web_sm")
doc = nlp("good customer service and great ambience")
matcher = Matcher(nlp.vocab)
# Pattern: one adjective followed by one or more nouns.
pattern = [{"POS": "ADJ"}, {"POS": "NOUN", "OP": "+"}]
# NOTE: this is the spaCy v2 call signature (key, on_match, *patterns).
# On spaCy v3 use: matcher.add("ADJ_NOUN_PATTERN", [pattern])
matcher.add("ADJ_NOUN_PATTERN", None, pattern)
matches = matcher(doc)
# Because of the "+" operator the matcher reports every candidate span, so
# "good customer" is returned alongside "good customer service". Convert the
# matches to Span objects and let filter_spans drop the overlapping shorter
# ones; it prefers the longest span among overlapping candidates.
candidate_spans = [doc[start:end] for _match_id, start, end in matches]
longest_spans = spacy.util.filter_spans(candidate_spans)
print("Matches:", [span.text for span in longest_spans])