#!/usr/bin/env python # Copyright (c) 2014 Sebastian Noack # # Permission is hereby granted, free of charge, to any person obtaining # a copy of this software and associated documentation files (the # "Software"), to deal in the Software without restriction, including # without limitation the rights to use, copy, modify, merge, publish, # distribute, sublicense, and/or sell copies of the Software, and to # permit persons to whom the Software is furnished to do so, subject to # the following conditions: # # The above copyright notice and this permission notice shall be included # in all copies or substantial portions of the Software. # # THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, # EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF # MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. # IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY # CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, # TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE # SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE. import urllib, BeautifulSoup, re REGIONS = ["", "ar", "au", "at", "be", "br", "bg", "ca", "cl", "cn", "co", "cr", "hr", "cz", "dk", "ec", "eg", "ee", "fi", "fr", "de", "gr", "gt", "hk", "hu", "igo", "in", "ie", "il", "it", "jp", "lu", "mk", "my", "mt", "mx", "nl", "nz", "no", "pe", "ph", "pl", "pt", "pr", "ro", "rs", "sg", "si", "za", "kr", "es", "se", "ch", "tw", "th", "uk", "scotland", "ug", "us", "ve", "vn"] TMPL = '''\ CC%(name)s: { licenseName: 'Creative Commons %(title)s', canonicalUrl: ['%(url)s'], identifier: 'CC-%(identifier)s', licenseFragments: [] }, ''' for license in ('by', 'by-sa'): for region in REGIONS: soup = BeautifulSoup.BeautifulSoup(urllib.urlopen('https://creativecommons.org/licenses/%s/0/%s' % (license, region)).read()) for link in soup.find(id='suggested_licenses').findAll('a'): url = link.get('href') title = link.text identifier = re.sub(r'.*/licenses/|/$', '', url).replace('/', '-') print TMPL % { 'name': identifier.replace('-', '').replace('.', '').lower(), 'url': url + 'legalcode', 'title': title, 'identifier': identifier.upper() }