please help me to correct my code:
import scrapy class QuotesSpider(scrapy.Spider):
name="popularity"
def start_requests(self):
with open('/home/jihane/Téléchargements/odm.csv/org.csv', 'rb') as f:
list=[]
for line in f.readlines():
array = line.split(',')
url = array[9]
list.append(url)
list.pop(0)
list for url in list: yield scrapy.Request(url=url, callback=self.parse)
def parse(self, response):
y={}
page=response.url
societe= response.url.split("/")[-1]
y={"url":page,"name":societe}
for t, v in zip(response.css("span.ProfileNav-label::text"),response.css("span.ProfileNav-value::text")):
t=t.extract()
v=v.extract()
y[t]=v
yield y
first :) pls format your code so it makes sense :)
second please tell the exact issue you have :) so we can help you :)
This code worked for me:
def start\\_requests(self): with open('csvfile', 'rb') as f: list=[] for line in f.readlines(): array = line.split(',') url = array[9] list.append(url) list.pop(0) for url in list: if url != "": yield scrapy.Request(url=url, callback=self.parse) def parse(self, response): y={} page=response.url societe= response.url.split("/")[-1] y={"url":page,"name":societe} #url and name of the entreprise for t, v in zip(response.css("span.ProfileNav-label::text"),response.css("span.ProfileNav-value::text")): t = t.extract() #label v = v.extract() #valeur label y[t]=v