CofeehousePy/deps/numpy/tools/cythonize.py

#!/usr/bin/env python3
""" cythonize

Cythonize pyx files into C files as needed.

Usage: cythonize [root_dir]

Default [root_dir] is 'numpy'.

Checks pyx files to see if they have been changed relative to their
corresponding C files.  If they have, then runs cython on these files to
recreate the C files.

The script decides whether a pyx file has changed relative to its C file
by comparing the current file hashes with those stored in a database file.

Simple script to invoke Cython (and Tempita) on all .pyx (.pyx.in)
files; while waiting for a proper build system. Uses file hashes to
figure out if rebuild is needed.

For now, this script should be run by developers when changing Cython files
only, and the resulting C files checked in, so that end-users (and Python-only
developers) do not get the Cython/Tempita dependencies.

Originally written by Dag Sverre Seljebotn, and copied here from:

https://raw.github.com/dagss/private-scipy-refactor/cythonize/cythonize.py

Note: this script does not check any of the dependent C libraries; it only
operates on the Cython .pyx files.
"""

import os
import re
import sys
import hashlib
import subprocess

# Name of the hash database file.  It is opened by bare name, so it is
# resolved against the working directory the script is run from.
HASH_FILE = 'cythonize.dat'
# Directory scanned when no root_dir argument is given on the command line.
DEFAULT_ROOT = 'numpy'
# Project name interpolated into the "requires Cython >= ..." error message.
VENDOR = 'NumPy'

# WindowsError is not defined on unix systems, so bind the name to None there;
# a later reference to it then does not raise NameError.
# NOTE(review): nothing in the visible part of this file reads WindowsError --
# confirm whether the shim is still needed.
try:
    WindowsError
except NameError:
    WindowsError = None

#
# Rules
#
def _cython_version_key(version):
    """Return a key that orders the version string *version*.

    ``distutils.version.LooseVersion`` is used when it can be imported, so
    the comparison is unchanged on interpreters that still ship distutils.
    distutils was removed from the standard library in Python 3.12
    (PEP 632); in that case the key is the tuple of integer components
    found in the string, e.g. ``'0.29.21'`` -> ``(0, 29, 21)``.
    """
    try:
        from distutils.version import LooseVersion
    except ImportError:
        return tuple(int(piece) for piece in re.findall(r'\d+', version))
    return LooseVersion(version)


def process_pyx(fromfile, tofile):
    """Run Cython on *fromfile*, writing the generated source to *tofile*.

    Cython is invoked as ``python -m cython`` through the interpreter that
    is running this script.  ``--cplus`` is added when *tofile* ends in
    ``.cxx``.

    Raises
    ------
    OSError
        If Cython cannot be imported by the running interpreter.
    RuntimeError
        If the importable Cython is older than the required version.
    subprocess.CalledProcessError
        If the cython subprocess exits with a non-zero status.
    """
    flags = ['-3', '--fast-fail']
    if tofile.endswith('.cxx'):
        flags.append('--cplus')

    try:
        # try the cython in the installed python first (somewhat related to scipy/scipy#2397)
        from Cython.Compiler.Version import version as cython_version
    except ImportError as exc:
        # The `cython` command need not point to the version installed in the
        # Python running this script, so raise an error to avoid the chance of
        # using the wrong version of Cython.
        raise OSError('Cython needs to be installed in Python as a module') from exc

    # Cython 0.29.21 is required for Python 3.9 and there are
    # other fixes in the 0.29 series that are needed even for earlier
    # Python versions.
    # Note: keep in sync with that in pyproject.toml
    required_version = '0.29.21'

    # Both sides go through the same helper so the two keys are always of the
    # same type and therefore comparable.
    if _cython_version_key(cython_version) < _cython_version_key(required_version):
        raise RuntimeError(f'Building {VENDOR} requires Cython >= {required_version}')
    subprocess.check_call(
        [sys.executable, '-m', 'cython'] + flags + ["-o", tofile, fromfile])


def process_tempita_pyx(fromfile, tofile):
    """Expand a Tempita ``.pyx.in`` template, then cythonize the result.

    The rendered text is written to a ``.pyx`` file whose name is *fromfile*
    with the ``.pyx.in`` suffix replaced by ``.pyx``; that file is then
    passed to ``process_pyx`` together with *tofile*.
    """
    import npy_tempita as tempita

    template_suffix = '.pyx.in'
    assert fromfile.endswith(template_suffix)
    with open(fromfile, "r") as template:
        rendered = tempita.sub(template.read())
    generated_pyx = fromfile[:-len(template_suffix)] + '.pyx'
    with open(generated_pyx, "w") as out:
        out.write(rendered)
    process_pyx(generated_pyx, tofile)


def process_tempita_pyd(fromfile, tofile):
    """Render the Tempita template *fromfile* and write the text to *tofile*.

    This is the processor registered for the ``.pyd.in`` -> ``.pyd`` rule,
    so the extension checks below must match that rule.  They previously
    tested for ``.pxd.in`` / ``.pxd``, which made every call dispatched from
    the rules table fail with AssertionError.
    """
    import npy_tempita as tempita

    assert fromfile.endswith('.pyd.in')
    assert tofile.endswith('.pyd')
    with open(fromfile, "r") as f:
        tmpl = f.read()
    pyxcontent = tempita.sub(tmpl)
    with open(tofile, "w") as f:
        f.write(pyxcontent)

def process_tempita_pxi(fromfile, tofile):
    """Render the ``.pxi.in`` Tempita template *fromfile* into *tofile*."""
    import npy_tempita as tempita

    assert fromfile.endswith('.pxi.in')
    assert tofile.endswith('.pxi')
    with open(fromfile, "r") as template:
        rendered = tempita.sub(template.read())
    with open(tofile, "w") as out:
        out.write(rendered)

def process_tempita_pxd(fromfile, tofile):
    """Render the ``.pxd.in`` Tempita template *fromfile* into *tofile*."""
    import npy_tempita as tempita

    assert fromfile.endswith('.pxd.in')
    assert tofile.endswith('.pxd')
    with open(fromfile, "r") as template:
        rendered = tempita.sub(template.read())
    with open(tofile, "w") as out:
        out.write(rendered)

# Dispatch table consulted by find_process_files: a file whose name ends with
# a key is handed to the paired processor, and the key is replaced by the
# paired output extension to form the target file name.
rules = {
    # source extension: (processor function, output extension)
    '.pyx': (process_pyx, '.c'),
    '.pyx.in': (process_tempita_pyx, '.c'),
    '.pxi.in': (process_tempita_pxi, '.pxi'),
    '.pxd.in': (process_tempita_pxd, '.pxd'),
    '.pyd.in': (process_tempita_pyd, '.pyd'),
}
#
# Hash db
#
def load_hashes(filename):
    """Load the hash database stored in *filename*.

    Each non-blank line holds three whitespace-separated fields: the source
    path, the hash of the input file and the hash of the output file.

    Returns
    -------
    dict
        ``{path: (input hash, output hash)}`` with all values kept as the
        strings read from the file; empty when *filename* is not an
        existing file.

    Raises
    ------
    ValueError
        If a non-blank line does not contain exactly three fields.
    """
    hashes = {}
    if not os.path.isfile(filename):
        return hashes
    with open(filename, 'r') as f:
        for line in f:
            fields = line.split()
            if not fields:
                # Tolerate blank / whitespace-only lines instead of failing
                # on the three-way unpack below.
                continue
            # Distinct local name: do not shadow the *filename* parameter.
            path, inhash, outhash = fields
            hashes[path] = (inhash, outhash)
    return hashes

def save_hashes(hash_db, filename):
    """Write *hash_db* to *filename*, one ``path inhash outhash`` line per entry.

    Entries are written in sorted key order; any existing file content is
    replaced.
    """
    with open(filename, 'w') as out:
        for path in sorted(hash_db):
            entry = hash_db[path]
            out.write("%s %s %s\n" % (path, entry[0], entry[1]))

def sha1_of_file(filename):
    """Return the hexadecimal SHA-1 digest of the bytes stored in *filename*."""
    with open(filename, "rb") as stream:
        payload = stream.read()
    return hashlib.sha1(payload).hexdigest()

#
# Main program
#

def normpath(path):
    """Return *path* with ``os.sep`` replaced by ``/`` and one leading ``./`` removed."""
    unified = '/'.join(path.split(os.sep))
    return unified[2:] if unified.startswith('./') else unified

def get_hash(frompath, topath):
    """Return ``(hash of frompath, hash of topath)``.

    The second element is ``None`` when *topath* does not exist.
    """
    input_digest = sha1_of_file(frompath)
    if os.path.exists(topath):
        output_digest = sha1_of_file(topath)
    else:
        output_digest = None
    return (input_digest, output_digest)

def process(path, fromfile, tofile, processor_function, hash_db):
    """Regenerate *tofile* from *fromfile* unless the stored hashes still match.

    *fromfile* and *tofile* are names inside the directory *path*.  When the
    current (input, output) hash pair equals the entry recorded in *hash_db*
    the file is reported as unchanged and nothing else happens.  Otherwise
    *processor_function* is called with the two bare names while the working
    directory is temporarily switched to *path*, and the fresh hash pair is
    stored back into *hash_db*.
    """
    source = os.path.join(path, fromfile)
    target = os.path.join(path, tofile)

    observed = get_hash(source, target)
    recorded = hash_db.get(normpath(source))
    if observed == recorded:
        print(f'{source} has not changed')
        return

    previous_dir = os.getcwd()
    try:
        os.chdir(path)
        print(f'Processing {source}')
        processor_function(fromfile, tofile)
    finally:
        # Always restore the caller's working directory, even on failure.
        os.chdir(previous_dir)

    # The target was just rewritten, so hash again before recording.
    hash_db[normpath(source)] = get_hash(source, target)


def find_process_files(root_dir):
    """Process every file directly inside *root_dir* that matches a rule.

    The hash database is loaded from ``HASH_FILE``; each matching file is
    passed to ``process`` with the processor and output extension taken from
    ``rules``, and the database is saved after every file.  Sub-directories
    are skipped, not descended into.

    For rules that produce ``.c`` the source is scanned for a
    ``# distutils: language = c++`` line; when found the output extension
    becomes ``.cxx`` instead.
    """
    hash_db = load_hashes(HASH_FILE)
    # Join with root_dir before testing: os.listdir returns bare names, and
    # os.path.isdir on a bare name would look in the current directory.
    files = [name for name in os.listdir(root_dir)
             if not os.path.isdir(os.path.join(root_dir, name))]
    # .pxi or .pxi.in files are most likely dependencies for
    # .pyx files, so we need to process them first
    files.sort(key=lambda name: name.endswith(('.pxi', '.pxi.in', '.pxd.in')),
               reverse=True)

    for filename in files:
        for fromext, value in rules.items():
            if not filename.endswith(fromext):
                continue
            if not value:
                # A falsy rule value means "matched, but nothing to do".
                break
            function, toext = value
            if toext == '.c':
                with open(os.path.join(root_dir, filename), 'rb') as f:
                    data = f.read()
                m = re.search(br"^\s*#\s*distutils:\s*language\s*=\s*c\+\+\s*$", data, re.I|re.M)
                if m:
                    toext = ".cxx"
            tofile = filename[:-len(fromext)] + toext
            process(root_dir, filename, tofile, function, hash_db)
            # Persist after each file so completed work is recorded even if
            # a later file fails.
            save_hashes(hash_db, HASH_FILE)
            break

def main():
    """Process the directory named by the first command-line argument.

    Falls back to ``DEFAULT_ROOT`` when no argument is given.
    """
    cli_args = sys.argv[1:]
    root_dir = cli_args[0] if cli_args else DEFAULT_ROOT
    find_process_files(root_dir)


# Run the command-line entry point only when this file is executed as a
# script, not when it is imported as a module.
if __name__ == '__main__':
    main()
Added numpy 2021-01-13 04:41:40 +01:00			`#!/usr/bin/env python3`
			`""" cythonize`

			`Cythonize pyx files into C files as needed.`

			`Usage: cythonize [root_dir]`

			`Default [root_dir] is 'numpy'.`

			`Checks pyx files to see if they have been changed relative to their`
			`corresponding C files. If they have, then runs cython on these files to`
			`recreate the C files.`

			`The script thinks that the pyx files have changed relative to the C files`
			`by comparing hashes stored in a database file.`

			`Simple script to invoke Cython (and Tempita) on all .pyx (.pyx.in)`
			`files; while waiting for a proper build system. Uses file hashes to`
			`figure out if rebuild is needed.`

			`For now, this script should be run by developers when changing Cython files`
			`only, and the resulting C files checked in, so that end-users (and Python-only`
			`developers) do not get the Cython/Tempita dependencies.`

			`Originally written by Dag Sverre Seljebotn, and copied here from:`

			`https://raw.github.com/dagss/private-scipy-refactor/cythonize/cythonize.py`

			`Note: this script does not check any of the dependent C libraries; it only`
			`operates on the Cython .pyx files.`
			`"""`

			`import os`
			`import re`
			`import sys`
			`import hashlib`
			`import subprocess`

			`HASH_FILE = 'cythonize.dat'`
			`DEFAULT_ROOT = 'numpy'`
			`VENDOR = 'NumPy'`

			`# WindowsError is not defined on unix systems`
			`try:`
			`WindowsError`
			`except NameError:`
			`WindowsError = None`

			`#`
			`# Rules`
			`#`
			`def process_pyx(fromfile, tofile):`
			`flags = ['-3', '--fast-fail']`
			`if tofile.endswith('.cxx'):`
			`flags.append('--cplus')`

			`try:`
			`# try the cython in the installed python first (somewhat related to scipy/scipy#2397)`
			`from Cython.Compiler.Version import version as cython_version`
			`except ImportError:`
			# The `cython` command need not point to the version installed in the
			`# Python running this script, so raise an error to avoid the chance of`
			`# using the wrong version of Cython.`
			`raise OSError('Cython needs to be installed in Python as a module')`
			`else:`
			`# check the version, and invoke through python`
			`from distutils.version import LooseVersion`

			`# Cython 0.29.21 is required for Python 3.9 and there are`
			`# other fixes in the 0.29 series that are needed even for earlier`
			`# Python versions.`
			`# Note: keep in sync with that in pyproject.toml`
			`required_version = LooseVersion('0.29.21')`

			`if LooseVersion(cython_version) < required_version:`
			`raise RuntimeError(f'Building {VENDOR} requires Cython >= {required_version}')`
			`subprocess.check_call(`
			`[sys.executable, '-m', 'cython'] + flags + ["-o", tofile, fromfile])`


			`def process_tempita_pyx(fromfile, tofile):`
			`import npy_tempita as tempita`

			`assert fromfile.endswith('.pyx.in')`
			`with open(fromfile, "r") as f:`
			`tmpl = f.read()`
			`pyxcontent = tempita.sub(tmpl)`
			`pyxfile = fromfile[:-len('.pyx.in')] + '.pyx'`
			`with open(pyxfile, "w") as f:`
			`f.write(pyxcontent)`
			`process_pyx(pyxfile, tofile)`


			`def process_tempita_pyd(fromfile, tofile):`
			`import npy_tempita as tempita`

			`assert fromfile.endswith('.pxd.in')`
			`assert tofile.endswith('.pxd')`
			`with open(fromfile, "r") as f:`
			`tmpl = f.read()`
			`pyxcontent = tempita.sub(tmpl)`
			`with open(tofile, "w") as f:`
			`f.write(pyxcontent)`

			`def process_tempita_pxi(fromfile, tofile):`
			`import npy_tempita as tempita`

			`assert fromfile.endswith('.pxi.in')`
			`assert tofile.endswith('.pxi')`
			`with open(fromfile, "r") as f:`
			`tmpl = f.read()`
			`pyxcontent = tempita.sub(tmpl)`
			`with open(tofile, "w") as f:`
			`f.write(pyxcontent)`

			`def process_tempita_pxd(fromfile, tofile):`
			`import npy_tempita as tempita`

			`assert fromfile.endswith('.pxd.in')`
			`assert tofile.endswith('.pxd')`
			`with open(fromfile, "r") as f:`
			`tmpl = f.read()`
			`pyxcontent = tempita.sub(tmpl)`
			`with open(tofile, "w") as f:`
			`f.write(pyxcontent)`

			`rules = {`
			`# fromext : function, toext`
			`'.pyx' : (process_pyx, '.c'),`
			`'.pyx.in' : (process_tempita_pyx, '.c'),`
			`'.pxi.in' : (process_tempita_pxi, '.pxi'),`
			`'.pxd.in' : (process_tempita_pxd, '.pxd'),`
			`'.pyd.in' : (process_tempita_pyd, '.pyd'),`
			`}`
			`#`
			`# Hash db`
			`#`
			`def load_hashes(filename):`
			`# Return { filename : (sha1 of input, sha1 of output) }`
			`if os.path.isfile(filename):`
			`hashes = {}`
			`with open(filename, 'r') as f:`
			`for line in f:`
			`filename, inhash, outhash = line.split()`
			`hashes[filename] = (inhash, outhash)`
			`else:`
			`hashes = {}`
			`return hashes`

			`def save_hashes(hash_db, filename):`
			`with open(filename, 'w') as f:`
			`for key, value in sorted(hash_db.items()):`
			`f.write("%s %s %s\n" % (key, value[0], value[1]))`

			`def sha1_of_file(filename):`
			`h = hashlib.sha1()`
			`with open(filename, "rb") as f:`
			`h.update(f.read())`
			`return h.hexdigest()`

			`#`
			`# Main program`
			`#`

			`def normpath(path):`
			`path = path.replace(os.sep, '/')`
			`if path.startswith('./'):`
			`path = path[2:]`
			`return path`

			`def get_hash(frompath, topath):`
			`from_hash = sha1_of_file(frompath)`
			`to_hash = sha1_of_file(topath) if os.path.exists(topath) else None`
			`return (from_hash, to_hash)`

			`def process(path, fromfile, tofile, processor_function, hash_db):`
			`fullfrompath = os.path.join(path, fromfile)`
			`fulltopath = os.path.join(path, tofile)`
			`current_hash = get_hash(fullfrompath, fulltopath)`
			`if current_hash == hash_db.get(normpath(fullfrompath), None):`
			`print(f'{fullfrompath} has not changed')`
			`return`

			`orig_cwd = os.getcwd()`
			`try:`
			`os.chdir(path)`
			`print(f'Processing {fullfrompath}')`
			`processor_function(fromfile, tofile)`
			`finally:`
			`os.chdir(orig_cwd)`
			`# changed target file, recompute hash`
			`current_hash = get_hash(fullfrompath, fulltopath)`
			`# store hash in db`
			`hash_db[normpath(fullfrompath)] = current_hash`


			`def find_process_files(root_dir):`
			`hash_db = load_hashes(HASH_FILE)`
			`files = [x for x in os.listdir(root_dir) if not os.path.isdir(x)]`
			`# .pxi or .pxi.in files are most likely dependencies for`
			`# .pyx files, so we need to process them first`
			`files.sort(key=lambda name: (name.endswith('.pxi') or`
			`name.endswith('.pxi.in') or`
			`name.endswith('.pxd.in')),`
			`reverse=True)`

			`for filename in files:`
			`in_file = os.path.join(root_dir, filename + ".in")`
			`for fromext, value in rules.items():`
			`if filename.endswith(fromext):`
			`if not value:`
			`break`
			`function, toext = value`
			`if toext == '.c':`
			`with open(os.path.join(root_dir, filename), 'rb') as f:`
			`data = f.read()`
			`m = re.search(br"^\s#\sdistutils:\slanguage\s=\sc\+\+\s$", data, re.I\|re.M)`
			`if m:`
			`toext = ".cxx"`
			`fromfile = filename`
			`tofile = filename[:-len(fromext)] + toext`
			`process(root_dir, fromfile, tofile, function, hash_db)`
			`save_hashes(hash_db, HASH_FILE)`
			`break`

			`def main():`
			`try:`
			`root_dir = sys.argv[1]`
			`except IndexError:`
			`root_dir = DEFAULT_ROOT`
			`find_process_files(root_dir)`


			`if __name__ == '__main__':`
			`main()`