is-github-page/main.py

38 lines
1.2 KiB
Python
Raw Normal View History

2021-11-21 00:15:48 -08:00
import socket
import os
import urllib.request
2021-11-21 00:49:49 -08:00
import urllib.parse
2021-11-21 00:15:48 -08:00
# 1-based progress counter; printed once per processed CSV row further down.
num = 1

# Download GitHub's service metadata document and keep its text so resolved
# addresses can be matched against it later. The context manager closes the
# HTTP response, and decoding yields the real text of the document rather
# than the "b'...'" repr that str(bytes) would produce.
with urllib.request.urlopen('https://api.github.com/meta') as response:
    githubip = response.read().decode('utf-8')
2021-11-21 00:49:49 -08:00
# Fetch the blog list CSV with wget. os.system() does not raise when wget is
# missing or fails, so success is judged by whether the file can be opened;
# a copy downloaded by hand into the current directory is accepted as well.
os.system("wget https://github.com/timqian/chinese-independent-blogs/raw/master/blogs-original.csv -O ./blogs-original.csv")
try:
    with open('blogs-original.csv', 'r', encoding='utf-8') as f:
        lines = f.read().splitlines()
except FileNotFoundError:
    print("您似乎没有安装wget请手动下载文件 https://github.com/timqian/chinese-independent-blogs/raw/master/blogs-original.csv 并放至当前目录")
    # Nothing to process: stop here instead of failing later on an
    # undefined `lines`.
    raise SystemExit(1)

# Write every domain whose resolved address matches the GitHub metadata to
# gh-domains.txt, one domain per line.
with open('gh-domains.txt', 'w', encoding='utf-8') as f:
    # The first row is skipped (presumably the CSV header).
    for line in lines[1:]:
        print(num)
        num = num + 1
        fields = line.replace(" ", "").split(',')
        # The URL is read from the second column; skip rows that lack it.
        if len(fields) < 2:
            continue
        domain = urllib.parse.urlparse(fields[1]).netloc
        # No host part (e.g. a URL without a scheme): nothing to resolve.
        if not domain:
            continue
        try:
            ip = socket.gethostbyname(domain)
        except (OSError, UnicodeError):
            # Unresolvable or malformed host names are skipped on purpose.
            continue
        # Compare on the first three octets only (a /24-style heuristic).
        ip_head = '.'.join(ip.split('.')[:3])
        # Anchor the prefix between the opening quote of a quoted address and
        # the dot after the third octet, so that e.g. "20.1.2" cannot match
        # inside "20.1.250.0/24" or "120.1.2.0/24".
        if '"' + ip_head + '.' in githubip:
            f.write(domain + "\n")
            print(domain + " is on GH-page!")

# Remove the downloaded CSV without spawning a shell; a missing file is fine.
try:
    os.remove('blogs-original.csv')
except FileNotFoundError:
    pass