import re
import nltk
import pandas as pd
from nltk.chunk import RegexpParser
from textblob import TextBlob
# Extract the cardinal-number tokens of every "DataChunk" found in data.txt.
#
# The file is split on '|' into segments and each segment into lines; every
# line containing the text 'Data' is POS-tagged with TextBlob and chunked with
# an NLTK RegexpParser. For each matching chunk, `Data` is set to its CD
# tokens joined by '/', so after the loop `Data` holds the value from the last
# matching chunk (it stays undefined if nothing matched).

# Read the whole input once; the context manager closes the handle.
with open('data.txt', 'r') as data_file:
    data = data_file.read()

# region Fetch Account Type
# Chunk grammar: a DataChunk is two or more NNP tags followed by one or more
# CD tags; the second rule chinks JJ/IN/DT/TO tags back out of any chunk.
chunkData = r"""DataChunk: {(<NNP><NNP>+<CD>+)}
}<JJ|IN|DT|TO>+{"""

# Build the parser once: the grammar does not change between lines.
Datachunker = RegexpParser(chunkData)

lstLines = data.split('|')
dataLines = []
for segment in lstLines:
    dataLines = segment.split("\n")
    for line in dataLines:
        if 'Data' not in line:
            continue
        DataTags = TextBlob(line).tags
        Datachunked = Datachunker.parse(DataTags)
        for chunk in Datachunked:
            # isinstance() rather than `type(chunk) == ...`: it is the
            # idiomatic check and does not call the name `type`.
            # NOTE(review): the reported "'str' object is not callable" may
            # come from `type` being rebound to a string elsewhere, or from an
            # NLTK version where `label` is not a method -- confirm which.
            if isinstance(chunk, nltk.tree.Tree) and chunk.label() == "DataChunk":
                DatachunkedLst = chunk.leaves()
                # Keep only the word of each (word, tag) leaf tagged CD; use a
                # separate name so the tree being iterated is not rebound.
                cd_tokens = [leaf[0] for leaf in DatachunkedLst if leaf[1] == 'CD']
                Data = '/'.join(cd_tokens)
Error: if type(chunk) == nltk.tree.Tree and chunk.label() == "DataChunk": TypeError: 'str' object is not callable(在 NLTK 中出現「'str' 對象不可調用」錯誤)
但是我能夠打印chunk.label()
你好維奈,請說明你想達到的目標,否則我們只能猜測。 –
請提供一些你從 data.txt 文件中讀取的數據。 –
你有沒有可能把一個字符串值賦給了一個名爲 'type' 的變量?例如 'type = "無概念"'? – lenz