-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathsetup.py
37 lines (36 loc) · 1.17 KB
/
setup.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
from setuptools import setup
# Packaging configuration for the ``datatools-py`` distribution.
#
# Read the long description up front so that the file handle is closed
# deterministically and decoding does not depend on the platform locale.
with open('README.md', encoding='utf-8') as readme_file:
    long_description = readme_file.read()

setup(
    name='datatools-py',
    version='0.1',
    # Every console script below is implemented in ``datatools.scripts``.
    # Sub-packages are not picked up implicitly, so it has to be listed here
    # or a regular (non-editable) install would ship broken commands.
    packages=['datatools', 'datatools.scripts'],
    install_requires=[
        'tqdm>=4.66.1',
        'numpy>=1.26.4',
        'simple_parsing>=0.1.5',
        'mosaicml-streaming>=0.7.5',
        'datasets>=2.18.0',
        'sentencepiece>=0.1.99',
        # Trailing comma keeps adjacent string literals from being silently
        # concatenated if another requirement is added or re-enabled below.
        'zstandard>=0.23.0',
        # 'transformers==4.39.3',
    ],
    author='Alexander Wettig',
    description='Library and scripts for common LM data utilities (tokenizing, splitting, packing, ...)',
    long_description=long_description,
    long_description_content_type='text/markdown',
    url='https://github.com/CodeCreator/datatools',
    classifiers=[
        'Programming Language :: Python :: 3',
        'License :: OSI Approved :: MIT License',
        'Operating System :: OS Independent',
    ],
    # Command-line tools installed with the package: ``name=module:function``.
    entry_points={
        'console_scripts': [
            'peek=datatools.scripts.peek:main',
            'merge_index=datatools.scripts.merge_index:main',
            'pack=datatools.scripts.pack:main',
            'wrangle=datatools.scripts.wrangle:main',
            'tokenize=datatools.scripts.tokenize:main',
        ],
    },
    # The numpy>=1.26.4 requirement only supports Python 3.9 and newer, so
    # declare that floor here and let pip reject older interpreters up front.
    python_requires='>=3.9',
)