This repository has been archived by the owner on Apr 15, 2024. It is now read-only.
-
Notifications
You must be signed in to change notification settings - Fork 1.1k
/
setup.py
74 lines (70 loc) · 2.21 KB
/
setup.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
#!/usr/bin/env python
from setuptools import setup
from setuptools.command.install import install
from pdfminer import __version__
class install_cmap(install):
def run(self):
import os.path
import pdfminer
from pdfminer.cmapdb import convert_cmap
outdir = os.path.join(os.path.join(self.install_lib, 'pdfminer'), 'cmap')
print('installing cmap: %r...' % outdir)
os.makedirs(outdir, exist_ok=True)
convert_cmap(
outdir, 'Adobe-CNS1',
{'B5':'cp950', 'UniCNS-UTF8':'utf-8'},
['cmaprsrc/cid2code_Adobe_CNS1.txt'])
convert_cmap(
outdir, 'Adobe-GB1',
{'GBK-EUC':'cp936', 'UniGB-UTF8':'utf-8'},
['cmaprsrc/cid2code_Adobe_GB1.txt'])
convert_cmap(
outdir, 'Adobe-Japan1',
{'RKSJ':'cp932', 'EUC':'euc-jp', 'UniJIS-UTF8':'utf-8'},
['cmaprsrc/cid2code_Adobe_Japan1.txt'])
convert_cmap(
outdir, 'Adobe-Korea1',
{'KSC-EUC':'euc-kr', 'KSC-Johab':'johab', 'KSCms-UHC':'cp949',
'UniKS-UTF8':'utf-8'},
['cmaprsrc/cid2code_Adobe_Korea1.txt'])
install.run(self)
return
with open('README.md') as fp:
long_description = fp.read()
setup(
cmdclass = { 'install': install_cmap },
name = 'pdfminer',
version = __version__,
description = 'PDF parser and analyzer',
long_description = long_description,
long_description_content_type = 'text/markdown',
license = 'MIT',
author = 'Yusuke Shinyama',
author_email = '[email protected]',
url = 'http://github.com/euske/pdfminer',
packages = [
'pdfminer',
],
python_requires = '>=3.6',
install_requires = [
'pycryptodome',
],
scripts = [
'tools/pdf2txt.py',
'tools/dumppdf.py',
],
keywords = [
'pdf parser',
'pdf converter',
'layout analysis',
'text mining'
],
classifiers = [
'Development Status :: 4 - Beta',
'Environment :: Console',
'Intended Audience :: Developers',
'Intended Audience :: Science/Research',
'License :: OSI Approved :: MIT License',
'Topic :: Text Processing',
],
)