2018-02-27 16:31:54 -05:00

116 lines
2.7 KiB
Python

import requests
from bs4 import BeautifulSoup
import multiprocessing
import os
proxy_index = 0
headers = {
"User-Agent": "Mozilla/5.0 (X11; Linux x86_64; rv:52.0) Gecko/20100101 Firefox/52.0",
"Accept": "text/html,application/xhtml+xml,application/xml;q=0.9,*/*;q=0.8",
"Accept-Language": "en-US,en;q=0.5",
"Accept-Encoding": "gzip, deflate, br",
"Upgrade-Insecure-Requests": "1"
}
proxies = {
'https': '',
}
def request_timeout(url):
while True:
try:
return requests.get(url, timeout=30)
except Exception as e:
print("!", end="", flush=True)
continue
def get_fonts():
for i in range(3758):
print(i)
r = request_timeout("https://fontmeme.com/fonts/page/" + str(i))
soup = BeautifulSoup(r.text, "html.parser")
for div in soup.findAll("div"):
if div.get("id") is not None and div.get("id") == "ptitle":
for child in div.children:
if child.get("href") is not None:
with open("fonts.txt", "a") as f:
f.write(child.get("href") + '\n')
def get_new_proxy():
global proxy_index
with open("proxies.txt", "r") as f:
line = f.read().splitlines()[proxy_index]
proxies["https"] = line
print("Switched to proxy " + line)
proxy_index += 1
def download_font(font_url):
file_path = "fonts/" + font_url[font_url[:-1].rfind("/")+1:-6] + ".zip"
if os.path.exists(file_path):
return
r1 = request_timeout(font_url)
dl_link_index = r1.text.find("https://fontmeme.com/fonts/download/")
if dl_link_index != -1:
dl_link = r1.text[dl_link_index: r1.text.find("'", dl_link_index)]
headers["Referer"] = font_url
try:
r = requests.get(dl_link, stream=True, headers=headers, proxies=proxies, cookies=r1.cookies, timeout=10)
except:
get_new_proxy()
return
if r.status_code != 200:
print(r.status_code)
return
reached_limit = False
with open(file_path, 'wb') as f:
for chunk in r.iter_content(chunk_size=1024):
if chunk:
f.write(chunk)
with open(file_path, "rb") as f:
if f.read().find(b"PK") != 0:
reached_limit = True
if reached_limit:
os.remove(file_path)
print("You have reached the maximum permitted downloads")
get_new_proxy()
def download_all():
pool = multiprocessing.Pool(processes=100)
with open("fonts.txt", "r") as f:
pool.map(download_font, f.read().splitlines())
# get_fonts()
# get_new_proxy()
download_all()