Spaces:
Paused
Paused
| #!/usr/bin/env python | |
| # Copyright 2018 Google Inc. | |
| # | |
| # Licensed under the Apache License, Version 2.0 (the "License"); | |
| # you may not use this file except in compliance with the License. | |
| # You may obtain a copy of the License at | |
| # | |
| # http://www.apache.org/licenses/LICENSE-2.0 | |
| # | |
| # Unless required by applicable law or agreed to in writing, software | |
| # distributed under the License is distributed on an "AS IS" BASIS, | |
| # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. | |
| # See the License for the specific language governing permissions and | |
| # limitations under the License.! | |
| import codecs | |
| import os | |
| import string | |
| import subprocess | |
| import sys | |
| import platform | |
| from setuptools import Extension, setup | |
| from setuptools.command.build_ext import build_ext as _build_ext | |
| from setuptools.command.build_py import build_py as _build_py | |
| sys.path.append(os.path.join('.', 'test')) | |
| def long_description(): | |
| with codecs.open('README.md', 'r', 'utf-8') as f: | |
| long_description = f.read() | |
| return long_description | |
| exec(open('src/sentencepiece/_version.py').read()) | |
| def run_pkg_config(section, pkg_config_path=None): | |
| try: | |
| cmd = 'pkg-config sentencepiece --{}'.format(section) | |
| if pkg_config_path: | |
| cmd = 'env PKG_CONFIG_PATH={} {}'.format(pkg_config_path, cmd) | |
| output = subprocess.check_output(cmd, shell=True) | |
| if sys.version_info >= (3, 0, 0): | |
| output = output.decode('utf-8') | |
| except subprocess.CalledProcessError: | |
| sys.stderr.write('Failed to find sentencepiece pkg-config\n') | |
| sys.exit(1) | |
| return output.strip().split() | |
| def is_sentencepiece_installed(): | |
| try: | |
| subprocess.check_call('pkg-config sentencepiece --libs', shell=True) | |
| return True | |
| except subprocess.CalledProcessError: | |
| return False | |
| def get_cflags_and_libs(root): | |
| cflags = ['-std=c++17', '-I' + os.path.join(root, 'include')] | |
| libs = [] | |
| if os.path.exists(os.path.join(root, 'lib/pkgconfig/sentencepiece.pc')): | |
| libs = [ | |
| os.path.join(root, 'lib/libsentencepiece.a'), | |
| os.path.join(root, 'lib/libsentencepiece_train.a'), | |
| ] | |
| elif os.path.exists(os.path.join(root, 'lib64/pkgconfig/sentencepiece.pc')): | |
| libs = [ | |
| os.path.join(root, 'lib64/libsentencepiece.a'), | |
| os.path.join(root, 'lib64/libsentencepiece_train.a'), | |
| ] | |
| return cflags, libs | |
| class build_ext(_build_ext): | |
| """Override build_extension to run cmake.""" | |
| def build_extension(self, ext): | |
| cflags, libs = get_cflags_and_libs('../build/root') | |
| if len(libs) == 0: | |
| if is_sentencepiece_installed(): | |
| cflags = cflags + run_pkg_config('cflags') | |
| libs = run_pkg_config('libs') | |
| else: | |
| subprocess.check_call(['./build_bundled.sh', __version__]) | |
| cflags, libs = get_cflags_and_libs('./build/root') | |
| # Fix compile on some versions of Mac OSX | |
| # See: https://github.com/neulab/xnmt/issues/199 | |
| if sys.platform == 'darwin': | |
| cflags.append('-mmacosx-version-min=10.9') | |
| else: | |
| cflags.append('-Wl,-strip-all') | |
| libs.append('-Wl,-strip-all') | |
| if sys.platform == 'linux': | |
| libs.append('-Wl,-Bsymbolic') | |
| print('## cflags={}'.format(' '.join(cflags))) | |
| print('## libs={}'.format(' '.join(libs))) | |
| ext.extra_compile_args = cflags | |
| ext.extra_link_args = libs | |
| _build_ext.build_extension(self, ext) | |
| def get_win_arch(): | |
| arch = 'win32' | |
| if sys.maxsize > 2**32: | |
| arch = 'amd64' | |
| if 'arm' in platform.machine().lower(): | |
| arch = 'arm64' | |
| if os.getenv('PYTHON_ARCH', '') == 'ARM64': | |
| # Special check for arm64 under ciwheelbuild, see https://github.com/pypa/cibuildwheel/issues/1942 | |
| arch = 'arm64' | |
| return arch | |
| if os.name == 'nt': | |
| # Must pre-install sentencepice into build directory. | |
| arch = get_win_arch() | |
| if os.path.exists('..\\build\\root_{}\\lib'.format(arch)): | |
| cflags = ['/std:c++17', '/I..\\build\\root_{}\\include'.format(arch)] | |
| libs = [ | |
| '..\\build\\root_{}\\lib\\sentencepiece.lib'.format(arch), | |
| '..\\build\\root_{}\\lib\\sentencepiece_train.lib'.format(arch), | |
| ] | |
| elif os.path.exists('..\\build\\root\\lib'): | |
| cflags = ['/std:c++17', '/I..\\build\\root\\include'] | |
| libs = [ | |
| '..\\build\\root\\lib\\sentencepiece.lib', | |
| '..\\build\\root\\lib\\sentencepiece_train.lib', | |
| ] | |
| else: | |
| # build library locally with cmake and vc++. | |
| cmake_arch = 'Win32' | |
| if arch == 'amd64': | |
| cmake_arch = 'x64' | |
| elif arch == "arm64": | |
| cmake_arch = "ARM64" | |
| subprocess.check_call([ | |
| 'cmake', | |
| 'sentencepiece', | |
| '-A', | |
| cmake_arch, | |
| '-B', | |
| 'build', | |
| '-DSPM_ENABLE_SHARED=OFF', | |
| '-DCMAKE_INSTALL_PREFIX=build\\root', | |
| ]) | |
| subprocess.check_call([ | |
| 'cmake', | |
| '--build', | |
| 'build', | |
| '--config', | |
| 'Release', | |
| '--target', | |
| 'install', | |
| '--parallel', | |
| '8', | |
| ]) | |
| cflags = ['/std:c++17', '/I.\\build\\root\\include'] | |
| libs = [ | |
| '.\\build\\root\\lib\\sentencepiece.lib', | |
| '.\\build\\root\\lib\\sentencepiece_train.lib', | |
| ] | |
| SENTENCEPIECE_EXT = Extension( | |
| 'sentencepiece._sentencepiece', | |
| sources=['src/sentencepiece/sentencepiece_wrap.cxx'], | |
| extra_compile_args=cflags, | |
| extra_link_args=libs, | |
| ) | |
| cmdclass = {} | |
| else: | |
| SENTENCEPIECE_EXT = Extension( | |
| 'sentencepiece._sentencepiece', | |
| sources=['src/sentencepiece/sentencepiece_wrap.cxx'], | |
| ) | |
| cmdclass = {'build_ext': build_ext} | |
| setup( | |
| name='sentencepiece', | |
| author='Taku Kudo', | |
| author_email='taku@google.com', | |
| description='SentencePiece python wrapper', | |
| long_description=long_description(), | |
| long_description_content_type='text/markdown', | |
| version=__version__, | |
| package_dir={'': 'src'}, | |
| url='https://github.com/google/sentencepiece', | |
| license='Apache', | |
| platforms='Unix', | |
| py_modules=[ | |
| 'sentencepiece/__init__', | |
| 'sentencepiece/_version', | |
| 'sentencepiece/sentencepiece_model_pb2', | |
| 'sentencepiece/sentencepiece_pb2', | |
| ], | |
| ext_modules=[SENTENCEPIECE_EXT], | |
| cmdclass=cmdclass, | |
| classifiers=[ | |
| 'Development Status :: 5 - Production/Stable', | |
| 'Environment :: Console', | |
| 'Intended Audience :: Developers', | |
| 'Intended Audience :: Science/Research', | |
| 'License :: OSI Approved :: Apache Software License', | |
| 'Operating System :: Unix', | |
| 'Programming Language :: Python', | |
| 'Topic :: Text Processing :: Linguistic', | |
| 'Topic :: Software Development :: Libraries :: Python Modules', | |
| ], | |
| test_suite='sentencepiece_test.suite', | |
| tests_require=['pytest'], | |
| ) | |