200 lines
7.2 KiB
Python
200 lines
7.2 KiB
Python
|
from app.filter import clean_query
|
||
|
from app.request import send_tor_signal
|
||
|
from app.utils.session import generate_key
|
||
|
from app.utils.bangs import gen_bangs_json, load_all_bangs
|
||
|
from app.utils.misc import gen_file_hash, read_config_bool
|
||
|
from base64 import b64encode
|
||
|
from bs4 import MarkupResemblesLocatorWarning
|
||
|
from datetime import datetime, timedelta
|
||
|
from dotenv import load_dotenv
|
||
|
from flask import Flask
|
||
|
import json
|
||
|
import logging.config
|
||
|
import os
|
||
|
from stem import Signal
|
||
|
import threading
|
||
|
import warnings
|
||
|
|
||
|
from werkzeug.middleware.proxy_fix import ProxyFix
|
||
|
|
||
|
from app.utils.misc import read_config_bool
|
||
|
from app.version import __version__
|
||
|
|
||
|
app = Flask(__name__, static_folder=os.path.dirname(
|
||
|
os.path.abspath(__file__)) + '/static')
|
||
|
|
||
|
app.wsgi_app = ProxyFix(app.wsgi_app)
|
||
|
|
||
|
# look for WHOOGLE_ENV, else look in parent directory
|
||
|
dot_env_path = os.getenv(
|
||
|
"WHOOGLE_DOTENV_PATH",
|
||
|
os.path.join(os.path.dirname(os.path.abspath(__file__)), "../whoogle.env"))
|
||
|
|
||
|
# Load .env file if enabled
|
||
|
if os.path.exists(dot_env_path):
|
||
|
load_dotenv(dot_env_path)
|
||
|
|
||
|
app.enc_key = generate_key()
|
||
|
|
||
|
if read_config_bool('HTTPS_ONLY'):
|
||
|
app.config['SESSION_COOKIE_NAME'] = '__Secure-session'
|
||
|
app.config['SESSION_COOKIE_SECURE'] = True
|
||
|
|
||
|
app.config['VERSION_NUMBER'] = __version__
|
||
|
app.config['APP_ROOT'] = os.getenv(
|
||
|
'APP_ROOT',
|
||
|
os.path.dirname(os.path.abspath(__file__)))
|
||
|
app.config['STATIC_FOLDER'] = os.getenv(
|
||
|
'STATIC_FOLDER',
|
||
|
os.path.join(app.config['APP_ROOT'], 'static'))
|
||
|
app.config['BUILD_FOLDER'] = os.path.join(
|
||
|
app.config['STATIC_FOLDER'], 'build')
|
||
|
app.config['CACHE_BUSTING_MAP'] = {}
|
||
|
app.config['LANGUAGES'] = json.load(open(
|
||
|
os.path.join(app.config['STATIC_FOLDER'], 'settings/languages.json'),
|
||
|
encoding='utf-8'))
|
||
|
app.config['COUNTRIES'] = json.load(open(
|
||
|
os.path.join(app.config['STATIC_FOLDER'], 'settings/countries.json'),
|
||
|
encoding='utf-8'))
|
||
|
app.config['TIME_PERIODS'] = json.load(open(
|
||
|
os.path.join(app.config['STATIC_FOLDER'], 'settings/time_periods.json'),
|
||
|
encoding='utf-8'))
|
||
|
app.config['TRANSLATIONS'] = json.load(open(
|
||
|
os.path.join(app.config['STATIC_FOLDER'], 'settings/translations.json'),
|
||
|
encoding='utf-8'))
|
||
|
app.config['THEMES'] = json.load(open(
|
||
|
os.path.join(app.config['STATIC_FOLDER'], 'settings/themes.json'),
|
||
|
encoding='utf-8'))
|
||
|
app.config['HEADER_TABS'] = json.load(open(
|
||
|
os.path.join(app.config['STATIC_FOLDER'], 'settings/header_tabs.json'),
|
||
|
encoding='utf-8'))
|
||
|
app.config['CONFIG_PATH'] = os.getenv(
|
||
|
'CONFIG_VOLUME',
|
||
|
os.path.join(app.config['STATIC_FOLDER'], 'config'))
|
||
|
app.config['DEFAULT_CONFIG'] = os.path.join(
|
||
|
app.config['CONFIG_PATH'],
|
||
|
'config.json')
|
||
|
app.config['CONFIG_DISABLE'] = read_config_bool('WHOOGLE_CONFIG_DISABLE')
|
||
|
app.config['SESSION_FILE_DIR'] = os.path.join(
|
||
|
app.config['CONFIG_PATH'],
|
||
|
'session')
|
||
|
app.config['MAX_SESSION_SIZE'] = 4000 # Sessions won't exceed 4KB
|
||
|
app.config['BANG_PATH'] = os.getenv(
|
||
|
'CONFIG_VOLUME',
|
||
|
os.path.join(app.config['STATIC_FOLDER'], 'bangs'))
|
||
|
app.config['BANG_FILE'] = os.path.join(
|
||
|
app.config['BANG_PATH'],
|
||
|
'bangs.json')
|
||
|
|
||
|
# Ensure all necessary directories exist
|
||
|
if not os.path.exists(app.config['CONFIG_PATH']):
|
||
|
os.makedirs(app.config['CONFIG_PATH'])
|
||
|
|
||
|
if not os.path.exists(app.config['SESSION_FILE_DIR']):
|
||
|
os.makedirs(app.config['SESSION_FILE_DIR'])
|
||
|
|
||
|
if not os.path.exists(app.config['BANG_PATH']):
|
||
|
os.makedirs(app.config['BANG_PATH'])
|
||
|
|
||
|
if not os.path.exists(app.config['BUILD_FOLDER']):
|
||
|
os.makedirs(app.config['BUILD_FOLDER'])
|
||
|
|
||
|
# Session values
|
||
|
app_key_path = os.path.join(app.config['CONFIG_PATH'], 'whoogle.key')
|
||
|
if os.path.exists(app_key_path):
|
||
|
try:
|
||
|
app.config['SECRET_KEY'] = open(app_key_path, 'r').read()
|
||
|
except PermissionError:
|
||
|
app.config['SECRET_KEY'] = str(b64encode(os.urandom(32)))
|
||
|
else:
|
||
|
app.config['SECRET_KEY'] = str(b64encode(os.urandom(32)))
|
||
|
with open(app_key_path, 'w') as key_file:
|
||
|
key_file.write(app.config['SECRET_KEY'])
|
||
|
key_file.close()
|
||
|
app.config['PERMANENT_SESSION_LIFETIME'] = timedelta(days=365)
|
||
|
|
||
|
# NOTE: SESSION_COOKIE_SAMESITE must be set to 'lax' to allow the user's
|
||
|
# previous session to persist when accessing the instance from an external
|
||
|
# link. Setting this value to 'strict' causes Whoogle to revalidate a new
|
||
|
# session, and fail, resulting in cookies being disabled.
|
||
|
app.config['SESSION_COOKIE_SAMESITE'] = 'Strict'
|
||
|
|
||
|
# Config fields that are used to check for updates
|
||
|
app.config['RELEASES_URL'] = 'https://github.com/' \
|
||
|
'benbusby/whoogle-search/releases'
|
||
|
app.config['LAST_UPDATE_CHECK'] = datetime.now() - timedelta(hours=24)
|
||
|
app.config['HAS_UPDATE'] = ''
|
||
|
|
||
|
# The alternative to Google Translate is treated a bit differently than other
|
||
|
# social media site alternatives, in that it is used for any translation
|
||
|
# related searches.
|
||
|
translate_url = os.getenv('WHOOGLE_ALT_TL', 'https://farside.link/lingva')
|
||
|
if not translate_url.startswith('http'):
|
||
|
translate_url = 'https://' + translate_url
|
||
|
app.config['TRANSLATE_URL'] = translate_url
|
||
|
|
||
|
app.config['CSP'] = 'default-src \'none\';' \
|
||
|
'frame-src ' + translate_url + ';' \
|
||
|
'manifest-src \'self\';' \
|
||
|
'img-src \'self\' data:;' \
|
||
|
'style-src \'self\' \'unsafe-inline\';' \
|
||
|
'script-src \'self\';' \
|
||
|
'media-src \'self\';' \
|
||
|
'connect-src \'self\';'
|
||
|
|
||
|
# Generate DDG bang filter
|
||
|
generating_bangs = False
|
||
|
if not os.path.exists(app.config['BANG_FILE']):
|
||
|
generating_bangs = True
|
||
|
json.dump({}, open(app.config['BANG_FILE'], 'w'))
|
||
|
bangs_thread = threading.Thread(
|
||
|
target=gen_bangs_json,
|
||
|
args=(app.config['BANG_FILE'],))
|
||
|
bangs_thread.start()
|
||
|
|
||
|
# Build new mapping of static files for cache busting
|
||
|
cache_busting_dirs = ['css', 'js']
|
||
|
for cb_dir in cache_busting_dirs:
|
||
|
full_cb_dir = os.path.join(app.config['STATIC_FOLDER'], cb_dir)
|
||
|
for cb_file in os.listdir(full_cb_dir):
|
||
|
# Create hash from current file state
|
||
|
full_cb_path = os.path.join(full_cb_dir, cb_file)
|
||
|
cb_file_link = gen_file_hash(full_cb_dir, cb_file)
|
||
|
build_path = os.path.join(app.config['BUILD_FOLDER'], cb_file_link)
|
||
|
|
||
|
try:
|
||
|
os.symlink(full_cb_path, build_path)
|
||
|
except FileExistsError:
|
||
|
# Symlink hasn't changed, ignore
|
||
|
pass
|
||
|
|
||
|
# Create mapping for relative path urls
|
||
|
map_path = build_path.replace(app.config['APP_ROOT'], '')
|
||
|
if map_path.startswith('/'):
|
||
|
map_path = map_path[1:]
|
||
|
app.config['CACHE_BUSTING_MAP'][cb_file] = map_path
|
||
|
|
||
|
# Templating functions
|
||
|
app.jinja_env.globals.update(clean_query=clean_query)
|
||
|
app.jinja_env.globals.update(
|
||
|
cb_url=lambda f: app.config['CACHE_BUSTING_MAP'][f.lower()])
|
||
|
|
||
|
# Attempt to acquire tor identity, to determine if Tor config is available
|
||
|
send_tor_signal(Signal.HEARTBEAT)
|
||
|
|
||
|
# Suppress spurious warnings from BeautifulSoup
|
||
|
warnings.simplefilter('ignore', MarkupResemblesLocatorWarning)
|
||
|
|
||
|
from app import routes # noqa
|
||
|
|
||
|
# The gen_bangs_json function takes care of loading bangs, so skip it here if
|
||
|
# it's already being loaded
|
||
|
if not generating_bangs:
|
||
|
load_all_bangs(app.config['BANG_FILE'])
|
||
|
|
||
|
# Disable logging from imported modules
|
||
|
logging.config.dictConfig({
|
||
|
'version': 1,
|
||
|
'disable_existing_loggers': True,
|
||
|
})
|