如果欄位由雙引號包圍,即使欄位內部含有逗號,也能正常解析。如果欄位是由單引號包圍,它會報錯,提示長度不匹配。
以下是蜘蛛(spider)代碼:
# -*- coding: utf-8 -*-
from scrapy.spider import Spider
from scrapy.selector import Selector
from stackoverflow23429315.items import DemoItem
from scrapy.contrib.spiders import CSVFeedSpider
from scrapy import log
class DmozSpider(CSVFeedSpider):
    """Spider that reads a local CSV file and emits one ``DemoItem`` per row.

    The class attributes configure the ``CSVFeedSpider`` base class:
    ``delimiter`` is the column separator and ``headers`` lists the column
    names, in file order, that become the keys of each parsed row.
    """

    name = 'csvFeedTest'
    start_urls = ['file:////home/vagrant/labs/stackoverflow23429315/test.csv']
    delimiter = ','
    headers = ['id', 'name', 'address1', 'address2', 'email']

    def parse_row(self, response, row):
        """Log one parsed CSV row and copy its columns into a ``DemoItem``.

        Args:
            response: The response the row was read from; not used here.
            row: The parsed row, indexed by the names listed in ``headers``.

        Returns:
            A ``DemoItem`` whose fields hold the row's column values.
        """
        # Wrap the row in a 1-tuple so the %-formatting always treats it as a
        # single value, whatever container type the row happens to be.
        log.msg('Hi, this is a row!: %r' % (row,))
        item = DemoItem()
        item['id'] = row['id']
        item['name'] = row['name']
        item['address1'] = row['address1']
        item['address2'] = row['address2']
        item['email'] = row['email']
        return item
項目類:
from scrapy.item import Item, Field
class DemoItem(Item):
    """Item holding one record, with a field for each of its five columns."""

    # The field names double as the item's keys (e.g. ``item['id']``), so
    # they are kept exactly as declared even though ``id`` shadows a builtin
    # inside the class body.
    id = Field()
    name = Field()
    address1 = Field()
    address2 = Field()
    email = Field()
測試CSV文件:
1,"John, Doe","1234 Main Street, APT A","2nd Floor",[email protected]
2,"John2, Doe","1234 Main Street, APT A","2nd Floor",[email protected]
3,'John3, Doe','1234 Main Street, APT A','2nd Floor',[email protected]
4,'John4, Doe','1234 Main Street, APT A','2nd Floor',[email protected]