-1

当我使用以下代码读取 CSV 标头时

def  read_header(gram):
    CSV_tag_read = csv.reader(open("Dataset/MALE_Training/"+str(gram)+"/"+str(gram)+".csv","rb"),delimiter='"')
    header=CSV_tag_read.next()

标题(csv文件的第一行)如下

Sample1"('CC', 'CD')"('CD', 'DT')"('DT', 'EX')"('EX', 'IN')"('IN', 'JJ')"('JJ', 'JJR')"('JJR', 'JJS')"('JJS', 'MD')"('MD', 'NN')"('NN', 'NNS')"('NNS', 'PRP')"('PRP', 'RB')"('RB', 'RBR')"('RBR', 'RP')"('RP', 'TO')"('TO', 'VB')"('VB', 'VBD')"('VBD', 'VBG')"('VBG', 'VBN')"('VBN', 'VBP')"('VBP', 'VBZ')"('VBZ', 'WDT')"('WDT', 'WP')"('WP', 'WRB')

我希望我的输出列表包含

['Sample1', '(CC, CD)', '(CD, DT)', '(DT, EX)', '(EX, IN)', '(IN, JJ)', '(JJ, JJR)', '(JJR, JJS)', '(JJS, MD)', '(MD, NN)', '(NN, NNS)', '(NNS, PRP)', '(PRP, RB)', '(RB, RBR)', '(RBR, RP)', '(RP, TO)', '(TO, VB)', '(VB, VBD)', '(VBD, VBG)', '(VBG, VBN)', '(VBN, VBP)', '(VBP, VBZ)', '(VBZ, WDT)', '(WDT, WP)', '(WP, WRB)']

4

1 回答 1

6

使用ast.literal_eval

>>> import ast
>>> a = "('TO', 'RP', 'TO')"
>>> b = ast.literal_eval(a)
>>> b
('TO', 'RP', 'TO')
>>> b[0]
'TO'

或者

>>> [x.strip("' ") for x in a.strip('()').split(',')]
['TO', 'RP', 'TO']

更新的答案对应于更新的问题:

with open('/path/to/csv-file.csv') as f:
    reader = csv.reader(f, delimiter='"')
    header = [column.replace("'", "") for column in header]
于 2013-11-02T05:28:35.257 回答