2019-02-02 10:18:57 +00:00
|
|
|
import os
|
|
|
|
import sqlite3
|
|
|
|
|
2019-02-15 10:47:50 +00:00
|
|
|
from cfg import config
|
|
|
|
if(not config["use_sqlite"]):
|
|
|
|
import pymysql
|
|
|
|
|
2019-02-02 10:18:57 +00:00
|
|
|
from proxy import fetch_proxies
|
|
|
|
|
2019-02-25 13:43:15 +00:00
|
|
|
def get_cache():
|
2019-02-15 10:47:50 +00:00
|
|
|
if(config["use_sqlite"]):
|
2019-02-25 13:43:15 +00:00
|
|
|
directory = config["sqlite_cache_directory"]
|
|
|
|
name = config["sqlite_cache_name"]
|
2019-02-15 10:47:50 +00:00
|
|
|
cache_file = os.path.join(directory, "{}.sqlite".format(name))
|
|
|
|
if(not os.path.exists(cache_file)):
|
|
|
|
with open(cache_file, "w") as fin:
|
|
|
|
pass
|
|
|
|
db = sqlite3.connect(cache_file)
|
|
|
|
|
|
|
|
cursor = db.cursor()
|
|
|
|
|
|
|
|
cursor.execute("CREATE TABLE proxies(proxy TEXT, lasttime_could_not_be_used DECIMAL)")
|
2019-02-19 13:16:22 +00:00
|
|
|
cursor.execute("CREATE TABLE links(source INT, destination INT)")
|
|
|
|
cursor.execute("CREATE TABLE dijkstra_helper(page INT UNIQUE, value INT)")
|
|
|
|
cursor.execute("CREATE TABLE failed_to_fetch(page INT, depth INT)")
|
|
|
|
cursor.execute("CREATE TABLE pages(title TEXT)")
|
2019-02-15 10:47:50 +00:00
|
|
|
|
|
|
|
db.commit()
|
2019-02-02 10:18:57 +00:00
|
|
|
db = sqlite3.connect(cache_file)
|
2019-02-15 10:47:50 +00:00
|
|
|
fetch_proxies(db)
|
|
|
|
return db
|
|
|
|
db = pymysql.connect(
|
|
|
|
host=config["mysql_server"]
|
|
|
|
, user=config["mysql_user"]
|
|
|
|
, password=config["mysql_password"]
|
|
|
|
, db=config["mysql_database"]
|
2019-02-15 11:46:32 +00:00
|
|
|
, charset="utf8mb4")
|
2019-02-02 10:18:57 +00:00
|
|
|
|
2019-02-15 10:47:50 +00:00
|
|
|
cursor = db.cursor()
|
2019-02-02 10:18:57 +00:00
|
|
|
|
2019-02-15 10:47:50 +00:00
|
|
|
cursor.execute("CREATE TABLE IF NOT EXISTS proxies(proxy varchar(100), lasttime_could_not_be_used DECIMAL)")
|
2019-02-19 13:16:22 +00:00
|
|
|
cursor.execute("CREATE TABLE IF NOT EXISTS links(source INT, destination INT)")
|
|
|
|
cursor.execute("CREATE TABLE IF NOT EXISTS dijkstra_helper(page INT UNIQUE, value INT)")
|
|
|
|
cursor.execute("CREATE TABLE IF NOT EXISTS failed_to_fetch(page INT, depth INT)")
|
|
|
|
cursor.execute('''CREATE TABLE IF NOT EXISTS
|
|
|
|
pages(
|
|
|
|
title varchar(400) CHARACTER SET utf8mb4
|
|
|
|
, page_id INT AUTO_INCREMENT
|
|
|
|
, PRIMARY KEY(page_id)
|
|
|
|
)''')
|
2019-02-02 10:18:57 +00:00
|
|
|
|
2019-02-15 10:47:50 +00:00
|
|
|
db.commit()
|
2019-02-15 11:46:32 +00:00
|
|
|
fetch_proxies(db)
|
2019-02-02 10:18:57 +00:00
|
|
|
return db
|
2019-02-15 10:47:50 +00:00
|
|
|
|
2019-02-02 10:18:57 +00:00
|
|
|
|
|
|
|
def clear_cache_data(connection):
|
|
|
|
cursor = connection.cursor()
|
|
|
|
cursor.execute("DELETE FROM links")
|
|
|
|
cursor.execute("DELETE FROM dijkstra_helper")
|
|
|
|
connection.commit()
|