2020-06-02 21:54:47 +03:00
|
|
|
from app.filter import Filter, get_first_link
|
2020-07-26 20:53:59 +03:00
|
|
|
from app.utils.session_utils import generate_user_keys
|
2020-06-02 21:54:47 +03:00
|
|
|
from app.request import gen_query
|
2020-12-18 00:06:47 +03:00
|
|
|
from bs4 import BeautifulSoup as bsoup
|
2020-06-02 21:54:47 +03:00
|
|
|
from cryptography.fernet import Fernet, InvalidToken
|
|
|
|
from flask import g
|
|
|
|
from typing import Any, Tuple
|
2021-01-23 22:50:30 +03:00
|
|
|
import os
|
2020-06-02 21:54:47 +03:00
|
|
|
|
Add tor and http/socks proxy support (#137)
* Add tor and http/socks proxy support
Allows users to enable/disable tor from the config menu, which will
forward all requests through Tor.
Also adds support for setting environment variables for alternative
proxy support. Setting the following variables will forward requests
through the proxy:
- WHOOGLE_PROXY_USER (optional)
- WHOOGLE_PROXY_PASS (optional)
- WHOOGLE_PROXY_TYPE (required)
- Can be "http", "socks4", or "socks5"
- WHOOGLE_PROXY_LOC (required)
- Format: "<ip address>:<port>"
See #30
* Refactor acquire_tor_conn -> acquire_tor_identity
Also updated travis CI to set up tor
* Add check for Tor socket on init, improve Tor error handling
Initializing the app sends a heartbeat request to Tor to check for
availability, and updates the home page config options accordingly. This
heartbeat is sent on every request, to ensure Tor support can be
reconfigured without restarting the entire app.
If Tor support is enabled, and a subsequent request fails, then a new
TorError exception is raised, and the Tor feature is disabled until a
valid connection is restored.
The maximum number of attempts has been raised to 10, since 5 seemed a bit
too low for how quickly the attempts go by.
* Change send_tor_signal arg type, update function doc
send_tor_signal now accepts a stem.Signal arg (a bit cleaner tbh). Also
added the doc string for the "disable" attribute in TorError.
* Fix tor identity logic in Request.send
* Update proxy init, change proxyloc var name
Proxy is now only initialized if both type and location are specified,
as neither has a default fallback and both are required. I suppose the
type could fall back to http, but this seems safer.
Also refactored proxyurl -> proxyloc for the runtime args in order to
match the Dockerfile args.
* Add tor/proxy support for Docker builds, fix opensearch/init
The Dockerfile is now updated to include support for Tor configuration,
with a working torrc file included in the repo.
An issue with opensearch was fixed as well, which was uncovered during
testing and was simple enough to fix here. Likewise, DDG bang gen was
updated to only ever happen if the file didn't exist previously, as
testing with the file being regenerated every time was tedious.
* Add missing "@" for socks proxy requests
2020-10-29 03:47:42 +03:00
|
|
|
# HTML banner inserted at the top of the results page when the outgoing
# request object reports a valid Tor connection.
TOR_BANNER = '<hr><h1 style="text-align: center">You are using Tor</h1><hr>'
|
|
|
|
|
|
|
|
|
2021-01-23 22:50:30 +03:00
|
|
|
def needs_https(url: str) -> bool:
    """Decide whether a request to *url* should be upgraded to HTTPS.

    An upgrade is needed for plain-HTTP URLs when either the URL ends with
    ``.herokuapp.com`` or the ``HTTPS_ONLY`` environment variable is enabled.

    Args:
        url: The URL to check.

    Returns:
        bool: True if the URL should be upgraded to HTTPS, False otherwise.

    """
    if not url.startswith('http://'):
        return False

    # Environment values are always strings, so parse the flag explicitly:
    # unset, empty, or an explicit "off" value disables enforcement. This
    # also guarantees that a real bool is returned, never the raw string.
    flag = os.getenv('HTTPS_ONLY', '').strip().lower()
    https_only = flag not in ('', '0', 'false', 'no', 'off')

    return https_only or url.endswith('.herokuapp.com')
|
|
|
|
|
|
|
|
|
2020-06-02 21:54:47 +03:00
|
|
|
class RoutingUtils:
    """Per-request helper that builds the search query and the response.

    Instances also support dict-style access (``obj['query']``), which is
    mapped directly onto attribute access.
    """

    def __init__(self, request, config, session, cookies_disabled=False):
        """Capture the request parameters and per-user state.

        Args:
            request: The incoming request. ``args`` is used for GET requests
                and ``form`` for every other method.
            config: The user config, passed on to the result filter and to
                query generation.
            session: Mapping that holds the user's ``fernet_keys``.
            cookies_disabled: Forwarded to ``generate_user_keys`` whenever
                keys are regenerated.
        """
        method = request.method
        self.request_params = request.args if method == 'GET' else request.form
        self.user_agent = request.headers.get('User-Agent')
        self.feeling_lucky = False
        self.config = config
        self.session = session
        self.query = ''
        self.cookies_disabled = cookies_disabled
        self.search_type = self.request_params.get('tbm', '')

    def __getitem__(self, name):
        return getattr(self, name)

    def __setitem__(self, name, value):
        return setattr(self, name, value)

    def __delitem__(self, name):
        return delattr(self, name)

    def __contains__(self, name):
        return hasattr(self, name)

    def new_search_query(self) -> str:
        """Read the ``q`` parameter and store the resulting search query.

        A new element key is generated on every call. When a query is
        present, decryption with the session's text key is attempted (for
        internal links), the text key is regenerated, and a leading ``'! '``
        marks the search as "feeling lucky".

        Returns:
            str: The query with any "feeling lucky" prefix removed, or an
            empty string if no query was supplied.

        """
        # Generate a new element key each time a new search is performed
        self.session['fernet_keys']['element_key'] = generate_user_keys(
            cookies_disabled=self.cookies_disabled)['element_key']

        q = self.request_params.get('q')
        if not q:
            return ''

        # Attempt to decrypt if this is an internal link
        try:
            q = Fernet(
                self.session['fernet_keys']['text_key']
            ).decrypt(q.encode()).decode()
        except InvalidToken:
            # Not an encrypted token: use the query text as submitted
            pass

        # Reset text key
        self.session['fernet_keys']['text_key'] = generate_user_keys(
            cookies_disabled=self.cookies_disabled)['text_key']

        # Strip leading '! ' for "feeling lucky" queries
        self.feeling_lucky = q.startswith('! ')
        self.query = q[2:] if self.feeling_lucky else q
        return self.query

    def bang_operator(self, bangs_dict: dict) -> str:
        """Resolve a leading bang operator in the query to a redirect URL.

        Args:
            bangs_dict: Maps each operator string to a dict whose ``'url'``
                entry is a format string taking the search terms.

        Returns:
            str: The formatted URL, or an empty string if the first
            space-separated token of the query is not a known operator.

        """
        operator = self.query.split(' ')[0]
        if operator not in bangs_dict:
            return ''

        # Drop only the leading operator; any later occurrence of the same
        # text belongs to the search terms and must be kept.
        search_terms = self.query[len(operator):].strip()
        return bangs_dict[operator]['url'].format(search_terms)

    def generate_response(self) -> Tuple[Any, int]:
        """Send the stored query and build the filtered result page.

        Returns:
            A 2-tuple. For "feeling lucky" searches this is the result of
            ``get_first_link`` and ``1``; otherwise it is the cleaned result
            soup and ``content_filter.elements``.

        """
        from urllib.parse import urlencode

        # The User-Agent header may be absent, in which case it is None
        user_agent = self.user_agent or ''
        mobile = 'Android' in user_agent or 'iPhone' in user_agent

        content_filter = Filter(
            self.session['fernet_keys'],
            mobile=mobile,
            config=self.config)
        full_query = gen_query(
            self.query,
            self.request_params,
            self.config,
            content_filter.near)
        get_body = g.user_request.send(query=full_query)

        # Produce cleanable html soup from response
        html_soup = bsoup(content_filter.reskin(get_body.text), 'html.parser')
        banner_markup = TOR_BANNER if g.user_request.tor_valid else ''
        html_soup.insert(0, bsoup(banner_markup, 'html.parser'))

        if self.feeling_lucky:
            return get_first_link(html_soup), 1

        formatted_results = content_filter.clean(html_soup)

        # Append user config to all search links, if available. Values come
        # straight from the request, so they are URL-encoded to keep
        # characters such as '&' or spaces from corrupting the link.
        param_str = ''.join(
            '&' + urlencode({k: v})
            for k, v in self.request_params.to_dict(flat=True).items()
            if self.config.is_safe_key(k))

        for link in formatted_results.find_all('a', href=True):
            href = link['href']
            # Only links with 'search?' at index 0 or 1 are rewritten
            if 'search?' not in href or href.index('search?') > 1:
                continue
            link['href'] += param_str

        return formatted_results, content_filter.elements
|