普通文本  |  225行  |  7.11 KB

# Copyright (c) 2012 The Chromium Authors. All rights reserved.
# Use of this source code is governed by a BSD-style license that can be
# found in the LICENSE file.

"""Test server for generating nested iframes with different sites.

Very simple python server for creating a bunch of iframes. The page generation
is randomized based on query parameters.  See the __init__ function of the
Params class for a description of the parameters.

This server relies on gevent. On Ubuntu, install it via:

  sudo apt-get install python-gevent

Run the server using

  python iframe_server.py

To use the server, run chrome as follows:

  google-chrome --host-resolver-rules='map *.invalid 127.0.0.1'

Change 127.0.0.1 to be the IP of the machine this server is running on. Then
in this chrome instance, navigate to any domain in .invalid
(eg., http://1.invalid:8090) to run this test.

"""

import colorsys
import copy
import random
import urllib
import urlparse

from gevent import pywsgi # pylint: disable=F0401

MAIN_PAGE = """
<html>
  <head>
    <style>
      body {
        background-color: %(color)s;
      }
    </style>
  </head>
  <body>
    <center>
      <h1><a href="%(url)s">%(site)s</a></h1>
      <p><small>%(url)s</small>
    </center>
    <br />
    %(iframe_html)s
  </body>
</html>
"""

IFRAME_FRAGMENT = """
<iframe src="%(src)s" width="%(width)s" height="%(height)s">
</iframe>
"""

class Params(object):
  """Simple object for holding parameters"""
  def __init__(self, query_dict):
    # Basic params:
    #  nframes is how many frames per page.
    #  nsites is how many sites to random choose out of.
    #  depth is how deep to make the frame tree
    #  pattern specifies how the sites are layed out per depth. An empty string
    #      uses a random N = [0, nsites] each time to generate a N.invalid URL.
    #      Otherwise sepcify with single letters like 'ABCA' and frame
    #      A.invalid will embed B.invalid will embed C.invalid will embed A.
    #  jitter is the amount of randomness applied to nframes and nsites.
    #      Should be from [0,1]. 0.0 means no jitter.
    #  size_jitter is like jitter, but for width and height.
    self.nframes = int(query_dict.get('nframes', [4] )[0])
    self.nsites = int(query_dict.get('nsites', [10] )[0])
    self.depth = int(query_dict.get('depth', [1] )[0])
    self.jitter = float(query_dict.get('jitter', [0] )[0])
    self.size_jitter = float(query_dict.get('size_jitter', [0.5] )[0])
    self.pattern = query_dict.get('pattern', [''] )[0]
    self.pattern_pos = int(query_dict.get('pattern_pos', [0] )[0])

    # Size parameters. Values are percentages.
    self.width = int(query_dict.get('width', [60])[0])
    self.height = int(query_dict.get('height', [50])[0])

    # Pass the random seed so our pages are reproduceable.
    self.seed = int(query_dict.get('seed',
                                   [random.randint(0, 2147483647)])[0])


def get_site(urlpath):
  """Takes a urlparse object and finds its approximate site.

  Site is defined as registered domain name + scheme. We approximate
  registered domain name by preserving the last 2 elements of the DNS
  name. This breaks for domains like co.uk.
  """
  no_port = urlpath.netloc.split(':')[0]
  host_parts = no_port.split('.')
  site_host = '.'.join(host_parts[-2:])
  return '%s://%s' % (urlpath.scheme, site_host)


def generate_host(rand, params):
  """Generates the host to be used as an iframes source.

  Uses the .invalid domain to ensure DNS will not resolve to any real
  address.
  """
  if params.pattern:
    host = params.pattern[params.pattern_pos]
    params.pattern_pos = (params.pattern_pos + 1) % len(params.pattern)
  else:
    host = rand.randint(1, apply_jitter(rand, params.jitter, params.nsites))
  return '%s.invalid' % host


def apply_jitter(rand, jitter, n):
  """Reduce n by random amount from [0, jitter]. Ensures result is >=1."""
  if jitter <= 0.001:
    return n
  v = n - int(n * rand.uniform(0, jitter))
  if v:
    return v
  else:
    return 1


def get_color_for_site(site):
  """Generate a stable (and pretty-ish) color for a site."""
  val = hash(site)
  # The constants below are arbitrary chosen emperically to look "pretty."
  # HSV is used because it is easier to control the color than RGB.
  # Reducing the H to 0.6 produces a good range of colors. Preserving
  # > 0.5 saturation and value means the colors won't be too washed out.
  h = (val % 100)/100.0 * 0.6
  s = 1.0 - (int(val/100) % 100)/200.
  v = 1.0 - (int(val/10000) % 100)/200.0
  (r, g, b) = colorsys.hsv_to_rgb(h, s, v)
  return 'rgb(%d, %d, %d)' % (int(r * 255), int(g * 255), int(b * 255))


def make_src(scheme, netloc, path, params):
  """Constructs the src url that will recreate the given params."""
  if path == '/':
    path = ''
  return '%(scheme)s://%(netloc)s%(path)s?%(params)s' % {
      'scheme': scheme,
      'netloc': netloc,
      'path': path,
      'params': urllib.urlencode(params.__dict__),
      }


def make_iframe_html(urlpath, params):
  """Produces the HTML fragment for the iframe."""
  if (params.depth <= 0):
    return ''
  # Ensure a stable random number per iframe.
  rand = random.Random()
  rand.seed(params.seed)

  netloc_paths = urlpath.netloc.split(':')
  netloc_paths[0] = generate_host(rand, params)

  width = apply_jitter(rand, params.size_jitter, params.width)
  height = apply_jitter(rand, params.size_jitter, params.height)
  iframe_params = {
      'src': make_src(urlpath.scheme, ':'.join(netloc_paths),
                      urlpath.path, params),
      'width': '%d%%' % width,
      'height': '%d%%' % height,
      }
  return IFRAME_FRAGMENT % iframe_params


def create_html(environ):
  """Creates the current HTML page. Also parses out query parameters."""
  urlpath = urlparse.urlparse('%s://%s%s?%s' % (
      environ['wsgi.url_scheme'],
      environ['HTTP_HOST'],
      environ['PATH_INFO'],
      environ['QUERY_STRING']))
  site = get_site(urlpath)
  params = Params(urlparse.parse_qs(urlpath.query))

  rand = random.Random()
  rand.seed(params.seed)

  iframe_htmls = []
  for frame in xrange(0, apply_jitter(rand, params.jitter, params.nframes)):
    # Copy current parameters into iframe and make modifications
    # for the recursive generation.
    iframe_params = copy.copy(params)
    iframe_params.depth = params.depth - 1
    # Base the new seed off the current seed, but have it skip enough that
    # different frame trees are unlikely to collide. Numbers and skips
    # not chosen in any scientific manner at all.
    iframe_params.seed = params.seed + (frame + 1) * (
        1000000 + params.depth + 333)
    iframe_htmls.append(make_iframe_html(urlpath, iframe_params))
  template_params = dict(params.__dict__)
  template_params.update({
      'color': get_color_for_site(site),
      'iframe_html': '\n'.join(iframe_htmls),
      'site': site,
      'url': make_src(urlpath.scheme, urlpath.netloc, urlpath.path, params),
      })
  return MAIN_PAGE % template_params


def application(environ, start_response):
  start_response('200 OK', [('Content-Type', 'text/html')])
  if environ['PATH_INFO'] == '/favicon.ico':
    yield ''
  else:
    yield create_html(environ)


server = pywsgi.WSGIServer(('', 8090), application)

server.serve_forever()