#!/usr/bin/env python # Copyright 2014 The Chromium Authors. All rights reserved. # Use of this source code is governed by a BSD-style license that can be # found in the LICENSE file. """Takes the JSON files in components/domain_reliability/baked_in_configs and encodes their contents as an array of C strings that gets compiled in to Chrome and loaded at runtime.""" import ast import json import os import sys # A whitelist of domains that the script will accept when baking configs in to # Chrome, to ensure incorrect ones are not added accidentally. Subdomains of # whitelist entries are also allowed (e.g. maps.google.com, ssl.gstatic.com). DOMAIN_WHITELIST = ( '2mdn.net', 'admob.biz', 'admob.co.in', 'admob.co.kr', 'admob.co.nz', 'admob.co.uk', 'admob.co.za', 'admob.com', 'admob.com.br', 'admob.com.es', 'admob.com.fr', 'admob.com.mx', 'admob.com.pt', 'admob.de', 'admob.dk', 'admob.es', 'admob.fi', 'admob.fr', 'admob.gr', 'admob.hk', 'admob.ie', 'admob.in', 'admob.it', 'admob.jp', 'admob.kr', 'admob.mobi', 'admob.no', 'admob.ph', 'admob.pt', 'admob.sg', 'admob.tw', 'admob.us', 'admob.vn', 'dartmotif.com', 'doubleclick.com', 'doubleclick.ne.jp', 'doubleclick.net', 'doubleclickusercontent.com', 'g.co', 'ggpht.com', 'gmodules.com', 'goo.gl', 'google-analytics.com', 'google-syndication.com', 'google.ac', 'google.ad', 'google.ae', 'google.af', 'google.ag', 'google.al', 'google.am', 'google.as', 'google.at', 'google.az', 'google.ba', 'google.be', 'google.bf', 'google.bg', 'google.bi', 'google.bj', 'google.bs', 'google.bt', 'google.by', 'google.ca', 'google.cat', 'google.cc', 'google.cd', 'google.cf', 'google.cg', 'google.ch', 'google.ci', 'google.cl', 'google.cm', 'google.cn', 'google.co.ao', 'google.co.bw', 'google.co.ck', 'google.co.cr', 'google.co.hu', 'google.co.id', 'google.co.il', 'google.co.im', 'google.co.in', 'google.co.je', 'google.co.jp', 'google.co.ke', 'google.co.kr', 'google.co.ls', 'google.co.ma', 'google.co.mz', 'google.co.nz', 'google.co.th', 'google.co.tz', 'google.co.ug', 'google.co.uk', 'google.co.uz', 'google.co.ve', 'google.co.vi', 'google.co.za', 'google.co.zm', 'google.co.zw', 'google.com', 'google.com.af', 'google.com.ag', 'google.com.ai', 'google.com.ar', 'google.com.au', 'google.com.bd', 'google.com.bh', 'google.com.bn', 'google.com.bo', 'google.com.br', 'google.com.by', 'google.com.bz', 'google.com.cn', 'google.com.co', 'google.com.cu', 'google.com.cy', 'google.com.do', 'google.com.ec', 'google.com.eg', 'google.com.et', 'google.com.fj', 'google.com.ge', 'google.com.gh', 'google.com.gi', 'google.com.gr', 'google.com.gt', 'google.com.hk', 'google.com.iq', 'google.com.jm', 'google.com.jo', 'google.com.kh', 'google.com.kw', 'google.com.lb', 'google.com.ly', 'google.com.mm', 'google.com.mt', 'google.com.mx', 'google.com.my', 'google.com.na', 'google.com.nf', 'google.com.ng', 'google.com.ni', 'google.com.np', 'google.com.nr', 'google.com.om', 'google.com.pa', 'google.com.pe', 'google.com.pg', 'google.com.ph', 'google.com.pk', 'google.com.pl', 'google.com.pr', 'google.com.py', 'google.com.qa', 'google.com.ru', 'google.com.sa', 'google.com.sb', 'google.com.sg', 'google.com.sl', 'google.com.sv', 'google.com.tj', 'google.com.tn', 'google.com.tr', 'google.com.tw', 'google.com.ua', 'google.com.uy', 'google.com.vc', 'google.com.ve', 'google.com.vn', 'google.cv', 'google.cz', 'google.de', 'google.dj', 'google.dk', 'google.dm', 'google.dz', 'google.ee', 'google.es', 'google.fi', 'google.fm', 'google.fr', 'google.ga', 'google.ge', 'google.gg', 'google.gl', 'google.gm', 'google.gp', 'google.gr', 'google.gy', 'google.hk', 'google.hn', 'google.hr', 'google.ht', 'google.hu', 'google.ie', 'google.im', 'google.info', 'google.iq', 'google.ir', 'google.is', 'google.it', 'google.it.ao', 'google.je', 'google.jo', 'google.jobs', 'google.jp', 'google.kg', 'google.ki', 'google.kz', 'google.la', 'google.li', 'google.lk', 'google.lt', 'google.lu', 'google.lv', 'google.md', 'google.me', 'google.mg', 'google.mk', 'google.ml', 'google.mn', 'google.ms', 'google.mu', 'google.mv', 'google.mw', 'google.ne', 'google.ne.jp', 'google.net', 'google.ng', 'google.nl', 'google.no', 'google.nr', 'google.nu', 'google.off.ai', 'google.org', 'google.pk', 'google.pl', 'google.pn', 'google.ps', 'google.pt', 'google.ro', 'google.rs', 'google.ru', 'google.rw', 'google.sc', 'google.se', 'google.sh', 'google.si', 'google.sk', 'google.sm', 'google.sn', 'google.so', 'google.sr', 'google.st', 'google.td', 'google.tg', 'google.tk', 'google.tl', 'google.tm', 'google.tn', 'google.to', 'google.tt', 'google.us', 'google.uz', 'google.vg', 'google.vu', 'google.ws', 'googleadservices.com', 'googlealumni.com', 'googleapis.com', 'googleapps.com', 'googlecbs.com', 'googlecommerce.com', 'googledrive.com', 'googleenterprise.com', 'googlegoro.com', 'googlehosted.com', 'googlepayments.com', 'googlesource.com', 'googlesyndication.com', 'googletagmanager.com', 'googletagservices.com', 'googleusercontent.com', 'googlevideo.com', 'gstatic.com', 'gvt1.com', 'gvt2.com', 'withgoogle.com', 'youtu.be', 'youtube-3rd-party.com', 'youtube-nocookie.com', 'youtube.ae', 'youtube.al', 'youtube.am', 'youtube.at', 'youtube.az', 'youtube.ba', 'youtube.be', 'youtube.bg', 'youtube.bh', 'youtube.bo', 'youtube.ca', 'youtube.cat', 'youtube.ch', 'youtube.cl', 'youtube.co', 'youtube.co.ae', 'youtube.co.at', 'youtube.co.hu', 'youtube.co.id', 'youtube.co.il', 'youtube.co.in', 'youtube.co.jp', 'youtube.co.ke', 'youtube.co.kr', 'youtube.co.ma', 'youtube.co.nz', 'youtube.co.th', 'youtube.co.ug', 'youtube.co.uk', 'youtube.co.ve', 'youtube.co.za', 'youtube.com', 'youtube.com.ar', 'youtube.com.au', 'youtube.com.az', 'youtube.com.bh', 'youtube.com.bo', 'youtube.com.br', 'youtube.com.by', 'youtube.com.co', 'youtube.com.do', 'youtube.com.ee', 'youtube.com.eg', 'youtube.com.es', 'youtube.com.gh', 'youtube.com.gr', 'youtube.com.gt', 'youtube.com.hk', 'youtube.com.hr', 'youtube.com.jm', 'youtube.com.jo', 'youtube.com.kw', 'youtube.com.lb', 'youtube.com.lv', 'youtube.com.mk', 'youtube.com.mt', 'youtube.com.mx', 'youtube.com.my', 'youtube.com.ng', 'youtube.com.om', 'youtube.com.pe', 'youtube.com.ph', 'youtube.com.pk', 'youtube.com.pt', 'youtube.com.qa', 'youtube.com.ro', 'youtube.com.sa', 'youtube.com.sg', 'youtube.com.tn', 'youtube.com.tr', 'youtube.com.tw', 'youtube.com.ua', 'youtube.com.uy', 'youtube.com.ve', 'youtube.cz', 'youtube.de', 'youtube.dk', 'youtube.ee', 'youtube.es', 'youtube.fi', 'youtube.fr', 'youtube.ge', 'youtube.gr', 'youtube.gt', 'youtube.hk', 'youtube.hr', 'youtube.hu', 'youtube.ie', 'youtube.in', 'youtube.is', 'youtube.it', 'youtube.jo', 'youtube.jp', 'youtube.kr', 'youtube.lk', 'youtube.lt', 'youtube.lv', 'youtube.ma', 'youtube.md', 'youtube.me', 'youtube.mk', 'youtube.mx', 'youtube.my', 'youtube.ng', 'youtube.nl', 'youtube.no', 'youtube.pe', 'youtube.ph', 'youtube.pk', 'youtube.pl', 'youtube.pr', 'youtube.pt', 'youtube.qa', 'youtube.ro', 'youtube.rs', 'youtube.ru', 'youtube.sa', 'youtube.se', 'youtube.sg', 'youtube.si', 'youtube.sk', 'youtube.sn', 'youtube.tn', 'youtube.ua', 'youtube.ug', 'youtube.uy', 'youtube.vn', 'youtubeeducation.com', 'youtubemobilesupport.com', 'ytimg.com' ) CC_HEADER = """// AUTOGENERATED FILE. DO NOT EDIT. // // (Update configs in components/domain_reliability/baked_in_configs and list // configs in components/domain_reliability/baked_in_configs.gypi instead.) #include "components/domain_reliability/baked_in_configs.h" #include namespace domain_reliability { const char* const kBakedInJsonConfigs[] = { """ CC_FOOTER = """ NULL }; } // namespace domain_reliability """ def read_json_files_from_gypi(gypi_file): with open(gypi_file, 'r') as f: gypi_text = f.read() json_files = ast.literal_eval(gypi_text)['variables']['baked_in_configs'] return json_files def domain_is_whitelisted(domain): return any(domain == e or domain.endswith('.' + e) for e in DOMAIN_WHITELIST) def quote_and_wrap_text(text, width=79, prefix=' "', suffix='"'): max_length = width - len(prefix) - len(suffix) output = prefix line_length = 0 for c in text: if c == "\"": c = "\\\"" elif c == "\n": c = "\\n" elif c == "\\": c = "\\\\" if line_length + len(c) > max_length: output += suffix + "\n" + prefix line_length = 0 output += c line_length += len(c) output += suffix return output def main(): if len(sys.argv) != 4: print >> sys.stderr, (('Usage: %s ' + ' ') % sys.argv[0]) print >> sys.stderr, sys.modules[__name__].__doc__ return 1 json_path = sys.argv[1] gypi_file = sys.argv[2] cpp_file = sys.argv[3] json_files = read_json_files_from_gypi(gypi_file) json_files = [ os.path.join(json_path, f) for f in json_files ] json_files = [ os.path.normpath(f) for f in json_files ] cpp_code = CC_HEADER found_invalid_config = False for json_file in json_files: with open(json_file, 'r') as f: json_text = f.read() try: config = json.loads(json_text) except ValueError, e: print >> sys.stderr, "%s: error parsing JSON: %s" % (json_file, e) found_invalid_config = True continue if 'monitored_domain' not in config: print >> sys.stderr, '%s: no monitored_domain found' % json_file found_invalid_config = True continue domain = config['monitored_domain'] if not domain_is_whitelisted(domain): print >> sys.stderr, ('%s: monitored_domain "%s" not in whitelist' % (json_file, domain)) found_invalid_config = True continue # Re-dump JSON to get a more compact representation. dumped_json_text = json.dumps(config, separators=(',', ':')) cpp_code += " // " + json_file + ":\n" cpp_code += quote_and_wrap_text(dumped_json_text) + ",\n" cpp_code += "\n" cpp_code += CC_FOOTER if found_invalid_config: return 1 with open(cpp_file, 'wb') as f: f.write(cpp_code) return 0 if __name__ == '__main__': sys.exit(main())