当前位置 : 主页 > 网页制作 > html >

爬取网易某只股票2017-01到2018-01的数据

来源:互联网 收集:自由互联 发布时间:2021-06-12
import urllib.request; import re; import urllib; import csv; from selenium import webdriver; from lxml import etree; import requests; x = 0; header = ['日期', '开盘价', '最高价', '最低价', '收盘价', …
import urllib.request
import re
import urllib
import csv
from selenium import webdriver
from lxml import  etree
import requests
# Scrape the daily trading history of stock 601939 from quotes.money.163.com
# (2017 Q1 through January 2018) and append it to a CSV file, oldest row first.

# Destination file; opened in append mode, so every run adds a new header
# line followed by the scraped rows.
CSV_PATH = 'C:\\Users\\lenovo\\Desktop\\mmm.csv'

# Column titles, in the same order as the <td> cells of one table row.
HEADER = ['日期', '开盘价', '最高价', '最低价', '收盘价', '涨跌额', '涨跌幅',
          '成交量', '成交金额', '振幅', '换手率']

# One page per (year, season); season is the quarter number 1-4.
URL_TEMPLATE = "http://quotes.money.163.com/trade/lsjysj_601939.html?year={}&season={}"

REQUEST_HEADERS = {
    'User-Agent': 'Mozilla/5.0 (Windows NT 6.1) AppleWebKit/537.36 '
                  '(KHTML, like Gecko) Chrome/63.0.3239.132 Safari/537.36',
}

# Rows dated on or after this day are not exported (ISO dates compare
# correctly as plain strings).
CUTOFF_DATE = '2018-02-01'

# The five quarterly pages that cover 2017-01 .. 2018-01.
QUARTERS = [(2017, 1), (2017, 2), (2017, 3), (2017, 4), (2018, 1)]


def rows_before_cutoff(rows, cutoff=CUTOFF_DATE):
    """Return *rows* in reverse order, stopping at the first date >= *cutoff*.

    rows: list of rows, each a list of cell texts whose first cell is an ISO
        ``YYYY-MM-DD`` date (or ``None`` for an empty cell).
    cutoff: ISO date string; the row carrying it and everything after it in
        the reversed sequence are dropped.

    The original script walked each page back to front, presumably because
    the site lists the newest trading day first -- TODO confirm against the
    live page.
    """
    selected = []
    for row in reversed(rows):
        date = (row[0] or '').strip()
        if date >= cutoff:
            break
        selected.append(row)
    return selected


def fetch_quarter_rows(year, season):
    """Download one quarterly page and return its data rows in page order.

    Each returned row is the list of ``td.text`` values of one ``<tr>`` whose
    class is ``""`` or ``"dbrow"``. Rows that do not have exactly
    ``len(HEADER)`` cells are skipped.

    Raises ``requests.RequestException`` on timeout, connection failure or a
    non-2xx HTTP status.
    """
    # headers= must be passed by keyword: the second positional argument of
    # requests.get is `params`, which would put the User-Agent in the query
    # string instead of sending it as a header.
    response = requests.get(URL_TEMPLATE.format(year, season),
                            headers=REQUEST_HEADERS, timeout=10)
    response.raise_for_status()
    page = etree.HTML(response.text)

    rows = []
    # A single XPath for both row classes keeps the rows in document order,
    # so no index arithmetic is needed to interleave the two kinds of row.
    for tr in page.xpath('//tr[@class="" or @class="dbrow"]'):
        cells = [td.text for td in tr.xpath('./td')]
        if len(cells) == len(HEADER):
            rows.append(cells)
    return rows


def main():
    """Write the header and all rows before CUTOFF_DATE to CSV_PATH."""
    with open(CSV_PATH, 'a+', newline='', encoding='utf-8') as f:
        writer = csv.writer(f)
        writer.writerow(HEADER)
        for year, season in QUARTERS:
            writer.writerows(rows_before_cutoff(fetch_quarter_rows(year, season)))


if __name__ == "__main__":
    main()
上一篇:DOM Tree
下一篇:restful api的10个最佳实践
网友评论