python MoJaVe
2021/11/2 22:09:55
本文主要是介绍python MoJaVe,对大家解决编程问题具有一定的参考价值,需要的程序猿们随着小编来一起学习吧!
import requests import pandas as pd import numpy as np import os from lxml import etree class Mojave(): def __init__(self): workDir = "MOJAVE" self.url = "http://www.physics.purdue.edu/astro/MOJAVE/allsources.html" self.headers = {"User-Agent": "Mozilla/5.0 (X11; Ubuntu; Linux x86_64; rv:92.0) Gecko/20100101 Firefox/92.0"} self.makeDir(workDir) def makeDir(self, dir): """ 创建目录,首先判断当前目录下是否存在活目录名字,存在就直接转入,不然就创建之后再转入 """ if os.path.exists(dir): os.chdir(dir) else: os.mkdir(dir) os.chdir(dir) def mainPage(self,url): """ :return: MOJAVE主页html """ try: response = requests.get(url=url, headers=self.headers,timeout=20) html = etree.HTML(response.text) return html except: print("爬取失败") def subPage(self): html=self.mainPage(url="http://www.physics.purdue.edu/astro/MOJAVE/sourcepages/0011+189.shtml") elements=html.xpath('/html/body/center/table[3]/tbody/tr[6]') print(len(elements)) def currentlySourceList(self): html = self.mainPage(url=self.url) currentlyUrl = ["http://www.physics.purdue.edu/astro/MOJAVE/" + i for i in html.xpath('//td[@style="background-color:rgb(204, 255, 255);"]/small/a/@href')] currentlyName = [i.replace(" ", "") for i in html.xpath('//td[@style="background-color:rgb(204, 255, 255);"]/small/a/text()')] return list(zip(currentlyName, currentlyUrl)) def noLongerSourceNameList(self): html = self.mainPage(url=self.url) noLongerUrl = ["http://www.physics.purdue.edu/astro/MOJAVE/" + i for i in html.xpath('//td[@bgcolor="#FFFFCC"]/small/a/@href')] cnoLongerName = [i.replace(" ", "") for i in html.xpath('//td[@bgcolor="#FFFFCC"]/small/a/text()')] return list(zip(noLongerUrl, cnoLongerName)) def _download(self,url,name): try: response=requests.get(url=url,headers=self.headers) with open(name,"wb") as file: file.write(response.content) print(name+"下载成功") except: print(name+"++++++++++++++++++++++++++下载失败") if __name__ == "__main__": Mojave().subPage()
这篇关于python MoJaVe的文章就介绍到这儿,希望我们推荐的文章对大家有所帮助,也希望大家多多支持为之网!
- 2025-01-03用FastAPI掌握Python异步IO:轻松实现高并发网络请求处理
- 2025-01-02封装学习:Python面向对象编程基础教程
- 2024-12-28Python编程基础教程
- 2024-12-27Python编程入门指南
- 2024-12-27Python编程基础
- 2024-12-27Python编程基础教程
- 2024-12-27Python编程基础指南
- 2024-12-24Python编程入门指南
- 2024-12-24Python编程基础入门
- 2024-12-24Python编程基础:变量与数据类型