Skip to content

Commit b09f9f7

Browse files
committed
创建目录
1 parent 0f969a6 commit b09f9f7

File tree

3 files changed

+94
-0
lines changed

3 files changed

+94
-0
lines changed

wuya/README.md

Lines changed: 12 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,12 @@
# Python 代码实例

- [jdSignin](https://github.com/JustDoPython/python-examples/tree/master/wuya/jdSignin) : 3分钟写一个脚本,每天定时薅东哥羊毛
- [shRent_1](https://github.com/JustDoPython/python-examples/tree/master/wuya/shRent_1) : 为了在上海租房,我用python连夜爬了20000多条房源信息...

---

从小白到工程师的学习之路

关注公众号:python 技术,回复"python"一起学习交流

![](http://favorites.ren/assets/images/python.jpg)

wuya/jdSignin/jd_sign.py

Lines changed: 25 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,25 @@
"""Daily jd.com bean sign-in script.

Posts the ``signBeanAct`` request with the user's session cookie
(pt_key / pt_pin), then pushes the result to the user via the
ServerChan (sctapi.ftqq.com) notification service.
"""
import requests

# SECURITY NOTE: pt_key/pt_pin grant full account access. Never commit
# real values (the original file leaked a live-looking pt_key in a
# comment); prefer reading them from environment variables.
pt_key = "替换为自己的pt_key"
pt_pin = "替换为自己的pt_pin"
cookie = "pt_key={}; pt_pin={}".format(pt_key, pt_pin)

# signBeanAct endpoint; the percent-encoded body is a fixed JSON blob of
# fingerprint fields the API expects.
url = "https://api.m.jd.com/client.action?functionId=signBeanAct&body=%7B%22fp%22%3A%22-1%22%2C%22shshshfp%22%3A%22-1%22%2C%22shshshfpa%22%3A%22-1%22%2C%22referUrl%22%3A%22-1%22%2C%22userAgent%22%3A%22-1%22%2C%22jda%22%3A%22-1%22%2C%22rnVersion%22%3A%223.9%22%7D&appid=ld"
headers = {
    "Content-Type": "application/x-www-form-urlencoded; charset=UTF-8",
    # Mimic the JD Android app's HTTP client so the API accepts the call.
    "User-Agent": "okhttp/3.12.1;jdmall;android;version/10.3.4;build/92451;",
    "Cookie": cookie,
}

response = requests.post(url=url, headers=headers)
print(response.text)

res = response.json()

# No "errorMessage" key in the JSON response means the sign-in succeeded.
if res.get("errorMessage") is None:
    returnMes = "签到成功!"
else:
    # BUG FIX: the original used "签到失败".format(...) — a format string
    # with no placeholder — so the server's error message was dropped.
    returnMes = "签到失败:{}".format(res.get("errorMessage"))

# Push the result via ServerChan (replace the path segment with your own SendKey).
requests.get("https://sctapi.ftqq.com/这里填写你个人的SendKey.send?title={}".format(returnMes))

wuya/shRent_1/shRent_1.py

Lines changed: 57 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,57 @@
"""Crawl Shanghai rental listings from Lianjia's zufang pages into a CSV.

For each district it reads the first listing page to learn the total page
count, enumerates every page URL, then scrapes each listing's URL, title,
estate name, price, area, address, orientation, layout, tags and region,
writing one CSV row per listing.
"""
import time, re, csv, requests
from bs4 import BeautifulSoup

# District slugs used in the listing URLs.
# (Renamed from `list`, which shadowed the builtin.)
districts = ['jingan', 'xuhui', 'huangpu', 'changning', 'putuo', 'pudong',
             'baoshan', 'hongkou', 'yangpu', 'minhang', 'jinshan', 'jiading',
             'chongming', 'fengxian', 'songjiang', 'qingpu']

# {district}/pg{page}rco11 — rco11 sorts by release time.
BASE_URL = 'https://sh.lianjia.com/zufang/{}/pg{}rco11/'
# Hoisted out of the loop: the original rebuilt this dict per district.
HEADERS = {'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/81.0.4044.9 Safari/537.36'}
CRAWL_DELAY = 0  # seconds between pages; raise this to be polite to the server

print("****处理开始****")

# Build the full list of page URLs: page 1 of each district, plus
# pages 2..N discovered from the pager's data-totalpage attribute.
urls = []
for district in districts:
    first_page = BASE_URL.format(district, 1)
    urls.append(first_page)
    res = requests.get(first_page, headers=HEADERS)
    soup = BeautifulSoup(res.text, 'html.parser')
    page_num = int(soup.find('div', attrs={'class': 'content__pg'}).attrs['data-totalpage'])
    for page in range(2, page_num + 1):
        urls.append(BASE_URL.format(district, page))

print(urls)

# BUG FIX: the original wrote a UTF-8 BOM with mode 'wb+' and then
# reopened the same file with mode 'w+', which truncates it and erases
# the BOM. 'utf-8-sig' emits the BOM and the rows in a single open,
# and `with` guarantees the handle is closed even on error.
with open(r'..\document\sh.csv', 'w', newline='', encoding='utf-8-sig') as f:
    writer = csv.writer(f)
    for num, url in enumerate(urls, start=1):
        print("正在处理第{}页数据...".format(str(num)))
        res = requests.get(url, headers=HEADERS)
        soup = BeautifulSoup(res.text, 'html.parser')
        infos = soup.find('div', {'class': 'content__list'}).find_all('div', {'class': 'content__list--item'})

        for info in infos:
            house_url = 'https://sh.lianjia.com' + info.a['href']
            title = info.find('p', {'class': 'content__list--item--title'}).find('a').get_text().strip()
            # First whitespace-separated token minus a 3-char prefix
            # (e.g. "整租·") leaves the estate/community name.
            group = title.split()[0][3:]
            price = info.find('span', {'class': 'content__list--item-price'}).get_text()
            tag = info.find('p', {'class': 'content__list--item--bottom oneline'}).get_text()
            # The description line is slash-separated:
            # address / area / orientation / ... / layout
            mixed = info.find('p', {'class': 'content__list--item--des'}).get_text()
            mix = re.split(r'/', mixed)
            address = mix[0].strip()
            area = mix[1].strip()
            door_orientation = mix[2].strip()
            style = mix[-1].strip()
            # Region is the part of the address before the first '-'.
            region = re.split(r'-', address)[0]
            writer.writerow((house_url, title, group, price, area, address,
                             door_orientation, style, tag, region))
        time.sleep(CRAWL_DELAY)
        print("第{}页数据处理完毕,共{}条数据。".format(str(num), len(infos)))

print("****全部完成****")

0 commit comments

Comments
 (0)