python快速接手别人的代码_Python 爬虫代码,网上找的别人的,但是报错,求高手指点...
本帖最后由 Ly102 于 2020-9-9 17:06 编辑
代码如下:
import os
import random
import json
import time
import ssl
import pandas as pd
import requests
import urllib3
#此文件我已上传到我的下载
from utils.read_write import writeOneJSON
# Swap the ssl module's default HTTPS context factory for the unverified one,
# so HTTPS contexts built through that default skip certificate verification.
ssl._create_default_https_context = ssl._create_unverified_context
# HTTP headers sent with every requests.post() call in this file.
# NOTE(review): the values look like a capture of the vendor's Android app
# traffic -- confirm before relying on any single field.
header = {
'Host': 'ytz.winshangdata.com',
'appType': 'ytzapp',
'Connection': 'keep-alive',
'Upgrade-Insecure-Requests': '1',
'platform': 'android',
'Accept': 'text/html,application/xhtml+xml,application/xml;q=0.9,image/webp,image/apng,*/*;q=0.8',
'Accept-Encoding': 'gzip, deflate',
'Accept-Language': 'zh-CN,en-US;q=0.9',
'X-Requested-With': 'com.winshangdata.ytz',
'uuid': '860000000229756,860000000229756',
# NOTE(review): 'token' and 'Cookie' are hard-coded, JWT-shaped session
# credentials; they have presumably expired and should come from
# configuration rather than source -- confirm.
'token': 'eyJhbGciOiJIUzI1NiJ9.eyJzdWIiOiJ7XCJleHBpclwiOjE1NzQzNDAxNDYxNTksXCJ1aWRcIjpcIkphY2tzb24yMjJcIixcInV1aWRcIjpcIjE1ODY5NzQyMTA4XCJ9IiwiaWF0IjoxNTczODIxNzQ2fQ.bQVKB1khKYu5LI9Do4zzkpqJd9xGDh5eNIJqcC7CORw',
'Cookie': 'auth={%22token%22:%22eyJhbGciOiJIUzI1NiJ9.eyJzdWIiOiJ7XCJleHBpclwiOjE1NzM3NDg0OTE4NDEsXCJ1aWRcIjpcIkphY2tzb24yMjJcIixcInV1aWRcIjpcIjE1ODY5NzQyMTA4XCJ9IiwiaWF0IjoxNTczMjMwMDkxfQ.vtCnWjWyM5tD8lmb2lWzhLfKzg4mTw-9W8mFmzdeVq8%22%2C%22refreshToken%22:%22eyJhbGciOiJIUzI1NiJ9.eyJzdWIiOiJ7XCJleHBpclwiOjE1NzQxMTkxMjQ1NDUsXCJ1aWRcIjpcIkphY2tzb24yMjJcIixcInV1aWRcIjpcIjE1ODY5NzQyMTA4XCJ9IiwiaWF0IjoxNTczMjMwMDkxfQ.7RrT9bIUO06wRDVsjHG_eSLQKa2IaLvyX-qRHvAWY48%22%2C%22uid%22:%2215869742108%22%2C%22uuid%22:%22860000000229756%2C860000000229756%22}',
'User-Agent': 'Mozilla/5.0 (Linux; Android 7.1.1; OPPO A73t Build/N6F26Q; wv) AppleWebKit/537.36 (KHTML, like Gecko) Version/4.0 Chrome/62.0.3202.84 Mobile Safari/537.36 uni-app Html5Plus/1.0 (Immersed/18.0)'
}
def getProjectRadius(id, path):
    """Fetch the radius-3 reports for one project and save each reply as JSON.

    Six endpoints are POSTed in a fixed order. Each JSON reply is written
    with ``writeOneJSON`` to ``<path>\\<id>_<report>_radius_3.json``.

    Args:
        id: Project identifier, sent as ``projectId`` and used in file names.
        path: Directory prefix the JSON files are written under.

    Returns:
        The decoded reply of ``getProjectBasicInformationCtr``, or ``None``
        when any step raised (the error is printed, not propagated).
    """
    try:
        brand_query = {
            "projectId": id,
            "radius": '3',
            "type": '1',
        }
        urllib3.disable_warnings()
        reply = requests.post(
            "https://ytz.winshangdata.com/mapapi/api/project/getBrandNumVoList",
            json=brand_query, headers=header, verify=False)
        writeOneJSON(json.loads(reply.text),
                     path + '\\' + str(id) + '_' + 'getBrandNumVoList_radius_3.json')

        # Every remaining endpoint takes the same two-field payload.
        radius_query = {
            "projectId": id,
            "radius": '3',
        }
        reply = requests.post(
            "https://ytz.winshangdata.com/mapapi/api/project/getProjectBasicInformationCtr",
            json=radius_query, headers=header, verify=False)
        basic_info = json.loads(reply.text)
        writeOneJSON(basic_info, path + '\\' + str(id) + '_' + 'BasicInformationCtr_radius_3.json')

        remaining = (
            ("https://ytz.winshangdata.com/mapapi/api/project/getKilometerSupportingFacilitiesCount",
             'getKilometerSupportingFacilitiesCount_radius_3.json'),
            ("https://ytz.winshangdata.com/mapapi/api/project/getProjectPeripheryXBaoGaoCtr",
             'getProjectPeripheryXBaoGaoCtr_radius_3.json'),
            ("https://ytz.winshangdata.com/mapapi/api/project/getProjectZhouBianRfCtr",
             'getProjectZhouBianRfCtr_radius_3.json'),
            ("https://ytz.winshangdata.com/mapapi/api/project/getProjectKmListCtr",
             'getProjectKmListCtr_radius_3.json'),
        )
        for endpoint, file_tail in remaining:
            reply = requests.post(endpoint, json=radius_query, headers=header, verify=False)
            writeOneJSON(json.loads(reply.text), path + '\\' + str(id) + '_' + file_tail)
        return basic_info
    except Exception as e:
        # Best-effort scrape: report which project failed and carry on.
        print('getProjectRadius')
        print(id)
        print(path)
        print(e)
def getLocationValueCtr(id, path, lon, lat, radius=3):
    """Fetch the location-value report around a coordinate and save it as JSON.

    The reply is written with ``writeOneJSON`` to
    ``<path>\\<id>_getLocationValueCtr_radius_<radius>.json``.

    Args:
        id: Project identifier, used only in the output file name.
        path: Directory prefix the JSON file is written under.
        lon: Longitude sent to the API.
        lat: Latitude sent to the API.
        radius: Search radius sent to the API. It used to be read from an
            undefined name although callers already passed it positionally;
            it is now a real parameter defaulting to 3.

    Returns:
        None. Any exception is printed together with ``id`` and ``path``
        instead of being propagated.
    """
    url = "https://ytz.winshangdata.com/mapapi/api/project/getLocationValueCtr"
    try:
        formdata = {
            "latitude": lat,
            "longitude": lon,
            "radius": radius,
        }
        urllib3.disable_warnings()
        response = requests.post(url, json=formdata, headers=header, verify=False)
        location_value = json.loads(response.text)
        # Name the file after the radius actually requested so that runs
        # with different radii do not overwrite each other.
        writeOneJSON(
            location_value,
            path + '\\' + str(id) + '_' + 'getLocationValueCtr_radius_' + str(radius) + '.json',
        )
    except Exception as e:
        # Best-effort scrape: report which project failed and carry on.
        print('getLocationValueCtr')
        print(id)
        print(path)
        print(e)
def getProject(id, path):
    """Fetch the leasing and radiation reports for one project and save them.

    Five endpoints are POSTed in a fixed order. Each JSON reply is written
    with ``writeOneJSON`` to ``<path>\\<id>_<report>.json``.

    Args:
        id: Project identifier, sent as ``projectId`` and used in file names.
        path: Directory prefix the JSON files are written under.

    Returns:
        None. Any exception is printed together with ``id`` and ``path``
        instead of being propagated; later endpoints are then skipped.
    """
    try:
        signed_list_query = {
            "floor": '',
            "industryType_id": '1001',
            "projectId": id,
        }
        id_only_query = {
            "projectId": id,
        }
        # (endpoint, payload, output file tail), in request order.
        jobs = (
            ("https://ytz.winshangdata.com/wsapi/project/getYiQianYueList3_5_forYtz",
             signed_list_query, 'getYiQianYueList3_5_forYtz.json'),
            ("https://ytz.winshangdata.com/mapapi/api/project/coreRadiationScopeReport",
             id_only_query, 'coreRadiationScopeReport.json'),
            ("https://ytz.winshangdata.com/wsapi/project/detailQianYueBrand3_6_forYtz",
             id_only_query, 'detailQianYueBrand3_6_forYtz.json'),
            ("https://ytz.winshangdata.com/mapapi/api/project/getRadiationRangeCtr",
             id_only_query, 'getRadiationRangeCtr_url.json'),
            ("https://ytz.winshangdata.com/wsapi/project/detailZhaoShangXuQiu",
             id_only_query, 'detailZhaoShangXuQiu.json'),
        )
        urllib3.disable_warnings()
        for endpoint, payload, file_tail in jobs:
            reply = requests.post(endpoint, json=payload, headers=header, verify=False)
            writeOneJSON(json.loads(reply.text), path + '\\' + str(id) + '_' + file_tail)
    except Exception as e:
        # Best-effort scrape: report which project failed and carry on.
        print('getProject')
        print(id)
        print(path)
        print(e)
def mall():
    """Scrape every project listed in the CSV at ``project_url``.

    Reads the module-level ``project_url`` (GBK-encoded CSV) and, for each
    row, takes the first column as the project id and the second as the
    project name. A directory ``save_url + name`` is created, then the
    radius, project and location-value reports are downloaded into it.

    Returns:
        None. Projects whose basic-information reply carries no ``data``
        are reported on stdout and skipped for the location-value report.
    """
    project_china = pd.read_csv(project_url, encoding='gbk')
    for _, project in project_china.iterrows():
        # .iloc makes the positional access explicit; plain project[0] is a
        # deprecated positional fallback on a label-indexed Series.
        projectId = str(project.iloc[0])
        projectName = project.iloc[1]

        path = (save_url + projectName).strip().rstrip("\\")
        os.makedirs(path, exist_ok=True)

        BasicInformationCtr = getProjectRadius(projectId, path)
        getProject(projectId, path)

        # getProjectRadius returns None on failure, and the reply may lack
        # a usable 'data' entry; both cases are reported the same way.
        data = BasicInformationCtr.get('data') if BasicInformationCtr else None
        if data:
            lon = data['longitude']
            lat = data['latitude']
            getLocationValueCtr(projectId, path, lon, lat, 3)
        else:
            print('以下项目基本数据为空')
            print(projectId)
            print(projectName)
def project_analysis(start=2419):
    """Scrape the projects in the module-level ``project_name_id`` frame.

    For each processed row the first column is the project id and the second
    the project name. A directory ``save_url + name`` is created, then the
    radius, project and location-value reports are downloaded into it.

    Args:
        start: Positional index of the first row to process. The default
            keeps the offset that was hard-coded here (presumably a resume
            point from an interrupted run -- confirm); pass 0 to process the
            whole file. Previously the loop walked every row but looked up
            row ``n + 2419``, which raised ``KeyError`` near the end of the
            frame.

    Returns:
        None. Projects whose basic-information reply carries no ``data``
        are reported on stdout and skipped for the location-value report.
    """
    for _, projectIdName in project_name_id.iloc[start:].iterrows():
        # .iloc makes the positional access explicit; plain row[0] is a
        # deprecated positional fallback on a label-indexed Series.
        projectId = int(projectIdName.iloc[0])
        projectName = projectIdName.iloc[1]

        path = (save_url + projectName).strip().rstrip("\\")
        os.makedirs(path, exist_ok=True)

        BasicInformationCtr = getProjectRadius(projectId, path)
        getProject(projectId, path)

        # getProjectRadius returns None on failure, and the reply may lack
        # a usable 'data' entry; both cases are reported the same way.
        data = BasicInformationCtr.get('data') if BasicInformationCtr else None
        if data:
            lon = data['longitude']
            lat = data['latitude']
            getLocationValueCtr(projectId, path, lon, lat, 3)
        else:
            print('以下项目基本数据为空')
            print(projectId)
            print(projectName)
if __name__ == "__main__":
    # Module-level settings read by mall() and project_analysis().
    # Backslashes are escaped explicitly: '\d' is an invalid escape sequence
    # that newer Python versions warn about.
    save_url = 'D:\\da\\'
    project_url = 'D:\\dcInfo.csv'
    # The CSV must exist and contain at least an id column and a name column;
    # an empty file makes pandas raise EmptyDataError.
    try:
        # pandas >= 1.3 spelling; error_bad_lines was removed in pandas 2.0.
        project_name_id = pd.read_csv(project_url, encoding='gbk', on_bad_lines='skip')
    except TypeError:
        # Older pandas does not know on_bad_lines; use the legacy keyword.
        project_name_id = pd.read_csv(project_url, encoding='gbk', error_bad_lines=False)
    project_analysis()
报错如下:
C:\Users\ASUS\AppData\Local\Programs\Python\Python38\python.exe E:/PyCharm/code/myfirstPython.py
Traceback (most recent call last):
File "E:/PyCharm/code/myfirstPython.py", line 184, in <module>
project_name_id = pd.read_csv(project_url,encoding='gbk',error_bad_lines=False)
File "C:\Users\ASUS\AppData\Local\Programs\Python\Python38\lib\site-packages\pandas\io\parsers.py", line 686, in read_csv
return _read(filepath_or_buffer, kwds)
File "C:\Users\ASUS\AppData\Local\Programs\Python\Python38\lib\site-packages\pandas\io\parsers.py", line 452, in _read
parser = TextFileReader(fp_or_buf, **kwds)
File "C:\Users\ASUS\AppData\Local\Programs\Python\Python38\lib\site-packages\pandas\io\parsers.py", line 936, in __init__
self._make_engine(self.engine)
File "C:\Users\ASUS\AppData\Local\Programs\Python\Python38\lib\site-packages\pandas\io\parsers.py", line 1168, in _make_engine
self._engine = CParserWrapper(self.f, **self.options)
File "C:\Users\ASUS\AppData\Local\Programs\Python\Python38\lib\site-packages\pandas\io\parsers.py", line 1981, in __init__
src = open(src, "rb")
FileNotFoundError: [Errno 2] No such file or directory: 'D:\\dcInfo.csv'
谢谢高手指教一下
我在D盘手动创建了一个 dcInfo.csv 文件,还是报错,如下:
C:\Users\ASUS\AppData\Local\Programs\Python\Python38\python.exe E:/PyCharm/code/myfirstPython.py
Traceback (most recent call last):
File "E:/PyCharm/code/myfirstPython.py", line 184, in <module>
project_name_id = pd.read_csv(project_url,encoding='gbk',error_bad_lines=False)
File "C:\Users\ASUS\AppData\Local\Programs\Python\Python38\lib\site-packages\pandas\io\parsers.py", line 686, in read_csv
return _read(filepath_or_buffer, kwds)
File "C:\Users\ASUS\AppData\Local\Programs\Python\Python38\lib\site-packages\pandas\io\parsers.py", line 452, in _read
parser = TextFileReader(fp_or_buf, **kwds)
File "C:\Users\ASUS\AppData\Local\Programs\Python\Python38\lib\site-packages\pandas\io\parsers.py", line 936, in __init__
self._make_engine(self.engine)
File "C:\Users\ASUS\AppData\Local\Programs\Python\Python38\lib\site-packages\pandas\io\parsers.py", line 1168, in _make_engine
self._engine = CParserWrapper(self.f, **self.options)
File "C:\Users\ASUS\AppData\Local\Programs\Python\Python38\lib\site-packages\pandas\io\parsers.py", line 1998, in __init__
self._reader = parsers.TextReader(src, **kwds)
File "pandas\_libs\parsers.pyx", line 540, in pandas._libs.parsers.TextReader.__cinit__
pandas.errors.EmptyDataError: No columns to parse from file
python快速接手别人的代码_Python 爬虫代码,网上找的别人的,但是报错,求高手指点...相关推荐
- 关于 使用python向qq好友发送消息(对爬虫的作用----当程序执行完毕或者报错无限给自己qq发送消息,直到关闭)...
以前看到网上一些小程序,在处理完事物后会自动发送qq消息,但是一直搞不懂是说明原理.也在网上找过一些python登陆qq发送消息的文字,但是都太复杂了.今天偶然看到一篇文章,是用python调用win ...
- python使用get和post方法_python爬虫中get和post方法介绍以及cookie作用
首先确定你要爬取的目标网站的表单提交方式,可以通过开发者工具看到.这里推荐使用chrome. 这里我用163邮箱为例 打开工具后再Network中,在Name选中想要了解的网站,右侧headers里的 ...
- 新手零基础:飞桨代码中关于图片路径读取和资源解压报错
#飞桨代码中关于图片路径读取和资源解压报错 1.路径读取 在进行路径图片读取时,不同版本的python的os模块在路径拼接时会报错,一般情况下os.path.join(path,name),是可以将路 ...
- SAP QM 执行事务代码QS51维护使用决策的选择集,系统报错 – Transaction no longer valid for catalog ‘3’ -
SAP QM 执行事务代码QS51维护使用决策的选择集,系统报错 – Transaction no longer valid for catalog '3' - 执行事务代码QS51,试图为工厂NMD ...
- SAP QM 执行事务代码QS23为检验特性分配Selected Set的时候报错 - You cannot use entries from catalogs 1 and 3-
SAP QM 执行事务代码QS23为检验特性分配Selected Set的时候报错 - You cannot use entries from catalogs 1 and 3- 我已经定义好了如下的 ...
- python快速接手别人的代码_十步教你如何接手别人的代码!
想必在很多程序员的职业生涯中,都有过一种难以避免的状况,即接下别人的代码.而这是种怎样的体验?有人说,接手别人的代码之后我也想辞职:有人说,一个连注释都没有的代码有何灵魂可言:更有网友说,如果你恨一个 ...
- python获取网站代码_python爬虫1——获取网站源代码(豆瓣图书top250信息)
# -*- coding: utf-8 -*- import requests import re import sys reload(sys) sys.setdefaultencoding('utf ...
- 爬虫python下载文献代码_Python爬虫案例:爬取微信公众号文章
本文的文字及图片来源于网络,仅供学习.交流使用,不具有任何商业用途,如有问题请及时联系我们以作处理. 文章转载于公众号:早起Python 作者:陈熹 大家好,今天我们来讲点Selenium自动化,你是 ...
- python爬虫知乎代码_python爬虫知乎的简单代码实现
随着时代的发展,我们很依赖网络帮助我们解决问题,遇到什么问题就会先百度.除了百度,现在大多数人还会选择通过知乎来解决问题.知乎类似于一个论坛,讨论度比百度高一些,那你知道如何用python爬虫爬知乎网 ...
最新文章
- 【2021-12-06】爬取关键词图片 - 去掉重复图片
- 报告 | 从20世纪70年代至今,自动驾驶汽车的发展经历了哪些历史性的变革?
- vsftpd类似wu-ftpd分类(Class)的配置-给不同网段的人以不同的上传权限-对虚拟用户进行访问IP限制...
- vc中调用其他应用程序的方法(函数) winexec,shellexecute ,createprocess
- 【Python】分享几个简单易懂的Python技巧,能够极大的提高工作效率哦!
- [HNOI2008]GT考试
- android studio import android-source-code
- Vue_(Router路由)-vue-router路由的基本用法
- python3 django开发_python3开发进阶-Django框架学习前的小项目(一个简单的学员管理系统)...
- 服务器2003系统U盘安装方法,u盘winpe下安装windows server 2003详细教程
- 每天学点Shiro-say hello
- Tensorflow基本语法和实现神经网络
- rplidar 三角测距激光雷达原理
- 25个常用Matplotlib图的Python代码,爱了爱了
- 1.42 财务测量指标——静态评价法(投资回报率+投资回收期)
- 国外常用免费博客平台
- 【异常检测论文】Anomaly Detection综述
- python星号画平行四边形_Python练习题 018:打印星号菱形
- iOS 10版本适配
- 单个正态总体方差的置信区间
热门文章
- linux调节伽马值软件,四个 Linux 下的“护眼”软件
- 网络层HTPPS和HTTP的概念与区别
- Julia Computing获得 2400 万美元融资,前 Snowflake CEO 加入董事会
- Springboot启动提示:com.alibaba.nacos.shaded.io.grpc.StatusRuntimeException: UNAVAILABLE: io exception
- rust被禁播还能玩吗_被强制下架的5部剧,后2部因“尺度太大”被禁播,如今已恢复上架...
- unity 图片遮罩有锯齿_如何消除UGUI Mask遮罩的锯齿
- php正则中英文数字,PHP正则匹配中英文、数字及下划线方法
- python批量压缩图片_Python图片批量压缩到指定大小并将JPG转为PNG格式
- wlop一张多少钱_小白有个问题,为什么很多人都说 WLOP 的画不够好?
- 在用origin画图时,图表左上角会出现大写字母C,去除方法: