#!/usr/bin/python
"""CGI front end of the Creative Commons license validator for Flickr images.

The script reads a site URI from the ``uri`` form field, passes its host
name to ``crawl`` and prints the images reported back in three groups:
attribution missing, attribution given, and owner unknown.

NOTE(review): most string literals below carry no HTML markup (several are
empty or whitespace only). The markup seems to have been lost from the copy
this revision was made from -- restore it from the deployed templates.
"""

# print is always called with exactly one parenthesised argument, so the
# output is the same whether print is a statement (Python 2) or a function.

import cgi
import cgitb

# crawl() is not defined in this file; presumably it comes from spider.
from spider import *

try:
    from html import escape as _html_escape  # Python 3.2+
except ImportError:
    from cgi import escape as _html_escape  # Python 2

cgitb.enable()

# URI scheme prefixes that validate_input() removes.
_SCHEMES = ("http://", "https://")

# Output printed for each non-zero license id, after "Has License".
# The image icons are stored in dig space.
# NOTE(review): all six entries are identical here because the per-license
# icon markup is missing; fill each one in with its own icon.
_LICENSE_ICONS = {
    1: "\n\n",
    2: "\n\n",
    3: "\n\n",
    4: "\n\n",
    5: "\n\n",
    6: "\n\n",
}


def _esc(value):
    """Return *value* as text that is safe in HTML text or a quoted attribute."""
    return _html_escape("%s" % (value,), True)


def validate_input(uri):
    """Return the site part of *uri*: no scheme prefix and no trailing path.

    The HTML parser apparently accepts only URIs without the ``http`` part,
    so a leading ``http://`` or ``https://`` is stripped, and everything
    from the first ``/`` after the host onwards is dropped.

    The scheme is only recognised at the very start of the value (ignoring
    surrounding whitespace and letter case). Looking for it anywhere in the
    string, as earlier revisions did, cut the first characters off inputs
    such as ``example.com/?next=http://other``.

    This function does not check that the site actually exists.
    """
    site = uri.strip()
    lowered = site.lower()
    for scheme in _SCHEMES:
        if lowered.startswith(scheme):
            site = site[len(scheme):]
            break
    # Keep only what precedes the first path separator.
    return site.split("/", 1)[0]


def print_table(list):
    """Print one table row per entry of *list*.

    *list* is iterated for its keys and indexed with them; each value is a
    sequence whose items 0 and 1 are printed and whose item 2 must be
    convertible to ``int``: 0 prints "All Rights Reserved", any other value
    prints "Has License" followed by the matching license icon, if any.

    The parameter keeps its historical name (which shadows the builtin) so
    that keyword callers continue to work.
    """
    entries = list
    print("")
    for key in entries:
        entry = entries[key]
        print("")
        print("")
        print("")
        # NOTE(review): the original format string had no placeholder left
        # for entry[1] (it raised TypeError), so the placeholder must have
        # been inside stripped markup. A link is assumed here -- confirm.
        print('\n\nBy <a href="%s">' % _esc(entry[1]))
        print('%s</a>\n' % _esc(entry[0]))
        license_id = int(entry[2])
        if license_id == 0:
            print("All Rights Reserved")
        else:
            # Add the license icon that indicates which license the Flickr
            # photo comes with, after the generic CC text.
            print("Has License\n\n")
            icon = _LICENSE_ICONS.get(license_id)
            if icon is not None:
                print(icon)
    # NOTE(review): indentation was lost in the reviewed copy; this closing
    # output is assumed to belong after the loop, not to every row.
    print("\n\n")


def _print_report(uri):
    """Crawl the site named by *uri* and print the three result sections."""
    # TODO: Check whether it's a valid URI
    result = crawl(validate_input(uri), '/')
    attr_given = result[0]
    attr_not_given = result[1]
    nameless = result[2]

    print(" ")
    # NOTE(review): as in print_table(), the first format string had lost
    # its placeholder; a link to the submitted URI is assumed.
    print('Results for the site <a href="%s">' % _esc(uri))
    print('%s</a>.\n' % _esc(uri))

    if len(attr_not_given) > 0:
        print("\n\nFound %s license violations for the following images."
              "\n\n" % (len(attr_not_given),))
        print_table(attr_not_given)
    else:
        print("\n\nNo license violations detected.\n\n")

    if len(attr_given) > 0:
        print("\n\nThese %s Flickr images were embedded in the site with "
              "proper attribution.\n\n" % (len(attr_given),))
        print_table(attr_given)

    if len(nameless) > 0:
        print("\n\nThe following images were found in the site, but Flickr "
              "does not seem to have a record of the owners of the images."
              "\n\n")
        print_table(nameless)


def main():
    """Handle one CGI request: print the page and, if given, the report.

    Any exception raised while building the page is reported in the
    response via ``cgi.print_exception()`` instead of propagating.
    """
    try:
        print("Content-type: text/html")
        print("")  # blank line that ends the HTTP headers
        print(" Creative Commons Validator for Flickr Images\n\n"
              "Creative Commons License Validator for Flickr Images\n\n")
        form = cgi.FieldStorage()
        # getfirst() always yields a single value, even when the field is
        # submitted more than once (getvalue() would return a list then).
        uri = form.getfirst("uri", "")
        print("\n\n")
        if uri:
            # Somebody has put in a value for the blog URI.
            _print_report(uri)
        # NOTE(review): assumed to close the page, so it runs whether or
        # not a URI was submitted -- confirm.
        print("")
    except Exception:
        print("\n\nOops. An error occurred!")
        cgi.print_exception()


if __name__ == "__main__":
    main()