blob: d0869e31bc1388e4e84423e9d11b9c24fc8291d8 [file] [log] [blame] [edit]
#!/usr/bin/python3
import cgi, os, socket, sys, urllib2
import common
from multiprocessing import pool
from frontend import setup_django_environment
from client.common_lib import global_config
from client.bin import utils
from frontend.afe.json_rpc import serviceHandler
from server import system_utils
from server import utils as server_utils
_PAGE = """\
Status: 302 Found
Content-Type: text/plain
Location: %s\r\n\r
"""
VIEWER_PREFIX = 'stainless.corp.google.com/browse/'
# Define function for retrieving logs
def _retrieve_logs_dummy(job_path):
pass
site_retrieve_logs = utils.import_site_function(__file__,
"tko.site_retrieve_logs", "site_retrieve_logs",
_retrieve_logs_dummy)
site_find_repository_host = utils.import_site_function(__file__,
"tko.site_retrieve_logs", "site_find_repository_host",
_retrieve_logs_dummy)
form = cgi.FieldStorage(keep_blank_values=True)
# determine if this is a JSON-RPC request. we support both so that the new TKO
# client can use its RPC client code, but the old TKO can still use simple GET
# params.
_is_json_request = form.has_key('callback')
# if this key exists, we check if requested log exists in local machine,
# and do not return Google Storage URL when the log doesn't exist.
_local_only = form.has_key('localonly')
def _get_requested_path():
if _is_json_request:
request_data = form['request'].value
request = serviceHandler.ServiceHandler.translateRequest(request_data)
parameters = request['params'][0]
return parameters['path']
return form['job'].value
def _check_result(args):
host = args['host']
job_path = args['job_path']
shard = args['shard']
if shard:
http_path = 'http://%s/tko/retrieve_logs.cgi?localonly&job=%s' % (
host, job_path)
else:
http_path = 'http://%s%s' % (host, job_path)
try:
# HACK: This urlopen call isn't forwarding HTTP headers correctly. This
# leads to uberproxy sitting between client (orignator of this request)
# and shard (target of the request) to redirect to the the login page.
# We detect this condition and reject the target shard as a viable
# redirect. The implication is that we will not redirect to the shard
# even if the user could themselves access the shard with the correct
# credentials.
u = utils.urlopen(http_path)
redirected_url = u.geturl()
if 'accounts.google.com' in redirected_url:
return None
# On Vms the shard name is set to the default gateway but the
# browser used to navigate frontends (that runs on the host of
# the vms) is immune to the same NAT routing the vms have, so we
# need to replace the gateway with 'localhost'.
if utils.DEFAULT_VM_GATEWAY in host:
normalized_host = host.replace(utils.DEFAULT_VM_GATEWAY, 'localhost')
else:
try:
normalized_host = utils.normalize_hostname(host)
except socket.herror:
# Ignore error: 'socket.herror: [Errno 1] Unknown host'
# This can happen when reverse name lookup is not stable.
normalized_host = host
return 'http', normalized_host, job_path
except urllib2.URLError:
return None
def _get_tpool_args(hosts, job_path, is_shard, host_set):
"""Get a list of arguments to be passed to multiprocessing.pool.ThreadPool.
@param hosts: a list of host names.
@param job_path: a requested job path.
@param is_shard: True if hosts are shards, False otherwise.
@param host_set: a Set to filter out duplicated hosts.
@return: a list of dictionaries to be used as input of _check_result().
"""
args = []
for host in hosts:
host = host.strip()
if host and host != 'localhost' and host not in host_set:
host_set.add(host)
arg = {'host': host, 'job_path': job_path, 'shard': is_shard}
args.append(arg)
return args
def find_repository_host(job_path):
"""Find the machine holding the given logs and return a URL to the logs"""
site_repo_info = site_find_repository_host(job_path)
if site_repo_info is not None:
return site_repo_info
# This cgi script is run only in client (cautotest) and shards.
# Drones do not run this script when receiving '/results/...' request.
# Only client should check drones and shards for the requested log.
# Also restricted users do not have access to drones or shards,
# always point them to localhost or google storage.
if (not server_utils.is_shard() and
not server_utils.is_restricted_user(os.environ.get('REMOTE_USER'))):
drones = system_utils.get_drones()
shards = system_utils.get_shards()
host_set = set()
tpool_args = _get_tpool_args(drones, job_path, False, host_set)
tpool_args += _get_tpool_args(shards, job_path, True, host_set)
tpool = pool.ThreadPool()
for result_path in tpool.imap_unordered(_check_result, tpool_args):
if result_path:
return result_path
# If the URL requested is a test result, it is now either on the local
# host or in Google Storage.
if job_path.startswith('/results/'):
# We only care about the path after '/results/'.
job_relative_path = job_path[9:]
if not _local_only and not os.path.exists(
os.path.join('/usr/local/autotest/results',
job_relative_path)):
gsuri = utils.get_offload_gsuri().split('gs://')[1]
return ['https', VIEWER_PREFIX, gsuri + job_relative_path]
def get_full_url(info, log_path):
if info is not None:
protocol, host, path = info
prefix = '%s://%s' % (protocol, host)
else:
prefix = ''
path = log_path
if _is_json_request:
return '%s/tko/jsonp_fetcher.cgi?%s' % (prefix,
os.environ['QUERY_STRING'])
else:
return prefix + path
log_path = _get_requested_path()
info = find_repository_host(log_path)
site_retrieve_logs(log_path)
print _PAGE % get_full_url(info, log_path)