| #!/usr/bin/env python |
| # |
| # |
| # Licensed to the Apache Software Foundation (ASF) under one |
| # or more contributor license agreements. See the NOTICE file |
| # distributed with this work for additional information |
| # regarding copyright ownership. The ASF licenses this file |
| # to you under the Apache License, Version 2.0 (the |
| # "License"); you may not use this file except in compliance |
| # with the License. You may obtain a copy of the License at |
| # |
| # http://www.apache.org/licenses/LICENSE-2.0 |
| # |
| # Unless required by applicable law or agreed to in writing, |
| # software distributed under the License is distributed on an |
| # "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY |
| # KIND, either express or implied. See the License for the |
| # specific language governing permissions and limitations |
| # under the License. |
| # |
| # |
| """This is a pre-commit hook that checks whether the contents of PO files |
| committed to the repository are encoded in UTF-8. |
| """ |
| |
| import codecs |
| import string |
| import sys |
| import subprocess |
| from svn import core, fs, delta, repos |
| |
| # Set to the path of the 'msgfmt' executable to use msgfmt to check |
| # the syntax of the po file |
| |
| USE_MSGFMT = None |
| |
| if USE_MSGFMT is not None: |
| class MsgFmtChecker: |
| def __init__(self): |
| self.pipe = subprocess.Popen([USE_MSGFMT, "-c", "-o", "/dev/null", "-"], |
| stdin=subprocess.PIPE, |
| close_fds=sys.platform != "win32") |
| self.io_error = 0 |
| |
| def write(self, data): |
| if self.io_error: |
| return |
| try: |
| self.pipe.stdin.write(data) |
| except IOError: |
| self.io_error = 1 |
| |
| def close(self): |
| try: |
| self.pipe.stdin.close() |
| except IOError: |
| self.io_error = 1 |
| return self.pipe.wait() == 0 and not self.io_error |
| else: |
| class MsgFmtChecker: |
| def write(self, data): |
| pass |
| def close(self): |
| return 1 |
| |
| |
| class ChangeReceiver(delta.Editor): |
| def __init__(self, txn_root, base_root, pool): |
| self.txn_root = txn_root |
| self.base_root = base_root |
| self.pool = pool |
| |
| def add_file(self, path, parent_baton, |
| copyfrom_path, copyfrom_revision, file_pool): |
| return [0, path] |
| |
| def open_file(self, path, parent_baton, base_revision, file_pool): |
| return [0, path] |
| |
| def apply_textdelta(self, file_baton, base_checksum): |
| file_baton[0] = 1 |
| # no handler |
| return None |
| |
| def close_file(self, file_baton, text_checksum): |
| changed, path = file_baton |
| if len(path) < 3 or path[-3:] != '.po' or not changed: |
| # This is not a .po file, or it hasn't changed |
| return |
| |
| try: |
| # Read the file contents through a validating UTF-8 decoder |
| subpool = core.svn_pool_create(self.pool) |
| checker = MsgFmtChecker() |
| try: |
| stream = core.Stream(fs.file_contents(self.txn_root, path, subpool)) |
| reader = codecs.getreader('UTF-8')(stream, 'strict') |
| writer = codecs.getwriter('UTF-8')(checker, 'strict') |
| while True: |
| data = reader.read(core.SVN_STREAM_CHUNK_SIZE) |
| if not data: |
| break |
| writer.write(data) |
| if not checker.close(): |
| sys.exit("PO format check failed for '" + path + "'") |
| except UnicodeError: |
| sys.exit("PO file is not in UTF-8: '" + path + "'") |
| finally: |
| core.svn_pool_destroy(subpool) |
| |
| |
| def check_po(pool, repos_path, txn): |
| def authz_cb(root, path, pool): |
| return 1 |
| |
| fs_ptr = repos.fs(repos.open(repos_path, pool)) |
| txn_ptr = fs.open_txn(fs_ptr, txn, pool) |
| txn_root = fs.txn_root(txn_ptr, pool) |
| base_root = fs.revision_root(fs_ptr, fs.txn_base_revision(txn_ptr), pool) |
| editor = ChangeReceiver(txn_root, base_root, pool) |
| e_ptr, e_baton = delta.make_editor(editor, pool) |
| repos.dir_delta(base_root, '', '', txn_root, '', |
| e_ptr, e_baton, authz_cb, 0, 1, 0, 0, pool) |
| |
| |
| if __name__ == '__main__': |
| assert len(sys.argv) == 3 |
| core.run_app(check_po, sys.argv[1], sys.argv[2]) |