forked from WojciechMula/pyahocorasick
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathsetup.py
129 lines (115 loc) · 3.95 KB
/
setup.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
# -*- coding: utf-8 -*-
"""
Aho-Corasick string search algorithm.
Author : Wojciech Muła, [email protected]
WWW : http://0x80.pl
License : BSD-3-Clause (see LICENSE)
"""
import os
from setuptools import setup
from setuptools import Extension
# check for presence of environment variables
build_as_bytes = "AHOCORASICK_BYTES" in os.environ
build_as_unicode = "AHOCORASICK_UNICODE" in os.environ
if build_as_unicode and build_as_bytes:
raise Exception(
"Cannot build pyahocorasick both as bytes and unicode: "
"only one of AHOCORASICK_UNICODE and AHOCORASICK_BYTES environment "
"variable should be set."
)
# we default to unicode
elif not build_as_unicode and not build_as_bytes:
build_as_unicode = True
if build_as_unicode:
macros = [("AHOCORASICK_UNICODE", "")]
else:
macros = []
def get_long_description():
import io
with io.open("README.rst", encoding="UTF-8") as f:
return f.read()
module = Extension(
"ahocorasick",
sources=[
"src/pyahocorasick.c",
],
define_macros=macros,
depends=[
"src/common.h",
"src/Automaton.c",
"src/Automaton.h",
"src/Automaton_pickle.c",
"src/AutomatonItemsIter.c",
"src/AutomatonItemsIter.h",
"src/AutomatonSearchIter.c",
"src/AutomatonSearchIter.h",
"src/AutomatonSearchIterLong.c",
"src/AutomatonSearchIterLong.h",
"src/trie.c",
"src/trie.h",
"src/slist.c",
"src/utils.c",
"src/trienode.c",
"src/trienode.h",
"src/msinttypes/stdint.h",
"src/inline_doc.h",
"src/pickle/pickle.h",
"src/pickle/pickle_data.h",
"src/pickle/pickle_data.c",
"src/custompickle/custompickle.h",
"src/custompickle/custompickle.c",
"src/custompickle/pyhelpers.h",
"src/custompickle/pyhelpers.c",
"src/custompickle/save/automaton_save.h",
"src/custompickle/save/automaton_save.c",
"src/custompickle/save/savebuffer.h",
"src/custompickle/save/savebuffer.c",
"src/custompickle/load/module_automaton_load.h",
"src/custompickle/load/module_automaton_load.c",
"src/custompickle/load/loadbuffer.h",
"src/custompickle/load/loadbuffer.c",
"src/pycallfault/pycallfault.h",
"src/pycallfault/pycallfault.c",
],
)
setup(
name="pyahocorasick",
version="2.0.0b1",
ext_modules=[module],
description=(
"pyahocorasick is a fast and memory efficient library for exact or "
"approximate multi-pattern string search. With the ``ahocorasick.Automaton`` "
"class, you can find multiple key string occurrences at once in some input "
"text. You can use it as a plain dict-like Trie or convert a Trie to an "
"automaton for efficient Aho-Corasick search. And pickle to disk for easy "
"reuse of large automatons. Implemented in C and tested on Python 3.6+. "
"Works on Linux, macOS and Windows. BSD-3-Cause license."
),
author="Wojciech Muła",
author_email="[email protected]",
maintainer="Wojciech Muła",
maintainer_email="[email protected]",
url="http://github.com/WojciechMula/pyahocorasick",
platforms=["Linux", "MacOSX", "Windows"],
license=" BSD-3-Clause and Public-Domain",
long_description=get_long_description(),
long_description_content_type="text/x-rst",
keywords=[
"aho-corasick",
"trie",
"automaton",
"dictionary",
],
classifiers=[
"Development Status :: 5 - Production/Stable",
"License :: OSI Approved :: BSD License",
"Programming Language :: C",
"Programming Language :: Python :: 3",
"Topic :: Software Development :: Libraries",
"Topic :: Text Editors :: Text Processing",
],
extras_require={
"testing": ["pytest", "twine", "setuptools", "wheel", ],
},
python_requires=">=3.6",
)