-
Notifications
You must be signed in to change notification settings - Fork 5
/
pyproject.toml
133 lines (122 loc) · 3.68 KB
/
pyproject.toml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
[tool.poetry]
# Core metadata of the "kwja" distribution.
name = "kwja"
version = "2.4.0"
description = "A unified Japanese analyzer based on foundation models"
license = "MIT"
readme = "README.md"
repository = "https://github.com/ku-nlp/kwja"
keywords = ["NLP", "japanese"]
# NOTE(review): every address below is the literal placeholder "[email protected]";
# the real e-mail addresses appear to have been redacted - confirm and restore.
authors = [
    "Hirokazu Kiyomaru <[email protected]>",
    "Nobuhiro Ueda <[email protected]>",
    "Kazumasa Omura <[email protected]>",
    "Takashi Kodama <[email protected]>",
    "Yugo Murawaki <[email protected]>",
    "Daisuke Kawahara <[email protected]>",
    "Sadao Kurohashi <[email protected]>",
]
maintainers = [
    "Hirokazu Kiyomaru <[email protected]>",
    "Nobuhiro Ueda <[email protected]>",
    "Kazumasa Omura <[email protected]>",
    "Takashi Kodama <[email protected]>",
    "Yugo Murawaki <[email protected]>",
]
classifiers = [
    "Environment :: GPU",
    "Environment :: MacOS X",
    "Natural Language :: Japanese",
    "Programming Language :: Python :: 3",
    "Programming Language :: Python :: 3.8",
    "Programming Language :: Python :: 3.9",
    "Programming Language :: Python :: 3.10",
    "Programming Language :: Python :: 3.11",
    "Programming Language :: Python :: 3.12",
    "Topic :: Scientific/Engineering",
    "Topic :: Text Processing",
]
# The "kwja" package is picked up from the "src" directory.
packages = [{ include = "kwja", from = "src" }]
# Additional file patterns to ship with the package.
include = ["kwja/resource/**/*"]
# File patterns to leave out of the package.
exclude = ["src/kwja/metrics/**/*"]
[tool.poetry.dependencies]
# Runtime requirements of the package.
python = ">=3.8,<3.13"
# torch 2.0.1 and 2.1.0 are excluded; see https://github.com/pytorch/pytorch/issues/100974
torch = ">=1.11,!=2.0.1,!=2.1.0"
# The numpy constraint depends on the Python version in use.
numpy = [
    { version = "~1.24.4", python = "<3.9" },
    { version = ">=1.26,<2.0", python = ">=3.9" },
]
transformers = { version = "~4.42.2", extras = ["sentencepiece"] }
tokenizers = "^0.19.1"
# As "lightning" comes with many extra dependencies, we stay with "pytorch-lightning".
pytorch-lightning = "~2.3.3"
omegaconf = "^2.1"
hydra-core = "^1.2"
rhoknp = "^1.6.0"
typer-slim = "^0.12.3"
jinf = "^1.0.4"
pure-cdb = "^4.0"
rich = ">=12.4"
pyyaml = "^6.0"
regex = ">=2024.7.24"
cohesion-tools = "^0.5.7"
# Only required on Python versions older than 3.9.
importlib-resources = { version = "^6.0", python = "<3.9" }
[tool.poetry.group.dev.dependencies]
# Requirements of the "dev" dependency group.
torchmetrics = "^1.0"
seqeval = "^1.2"
# The scikit-learn constraint depends on the Python version in use.
scikit-learn = [
    { version = "^1.3", python = "<3.9" },
    { version = "^1.4", python = ">=3.9" },
]
Levenshtein = ">=0.21.0"
# Same version range as the runtime dependency, plus the "eval" extra.
cohesion-tools = { version = "^0.5.7", extras = ["eval"] }
python-dotenv = "^1.0"
jaconv = "^0.3.4"
# The ipython constraint depends on the Python version in use.
ipython = [
    { version = "~8.12.1", python = "<3.9" },
    { version = "^8.13", python = ">=3.9" },
]
ipdb = "^0.13.13"
types-attrs = "^19.1"
types-pyyaml = "^6.0.12.9"
wandb = "^0.17.5"
[tool.poetry.group.test.dependencies]
# Requirements of the "test" dependency group.
# Test runner and its plugins.
pytest = "^8.0"
pytest-cov = "^5.0"
pytest-profiling = "^1.7"
# Libraries also listed in the "dev" group (presumably imported by the code under test - confirm).
torchmetrics = "^1.0"
seqeval = "^1.2"
Levenshtein = ">=0.21.0"
jaconv = "^0.3.4"
pandas = "^2.0"
[tool.poetry.scripts]
# Installs a `kwja` console command that invokes `app` from the `kwja.cli.cli` module.
kwja = "kwja.cli.cli:app"
[tool.black]
# NOTE(review): the package classifiers also list Python 3.12, but "py312" is
# not among the targets here - confirm whether that is intentional.
target-version = ["py38", "py39", "py310", "py311"]
line-length = 120
[tool.isort]
# Use isort's black-compatible profile with the same 120-column limit as black.
profile = "black"
line_length = 120
src_paths = ["src"]
# NOTE(review): targets Python 3.9 although the package still supports 3.8 - confirm.
py_version = 39
[tool.flake8]
max-line-length = 120
# Checks that are switched off:
#   E203 - not PEP 8 compliant; black inserts whitespace around slice colons
#          (https://black.readthedocs.io/en/stable/faq.html#why-are-flake8-s-e203-and-w503-violated)
#   E501 - line too long; disabled to allow the long comment and print lines that black allows
#   W503 - line break before binary operator (https://www.flake8rules.com/rules/W503.html)
ignore = ["E203", "E501", "W503"]
[tool.mypy]
# Python version mypy type-checks against. Written as a string on purpose:
# as a bare TOML float, a later bump to 3.10 would be read as 3.1.
python_version = "3.8"
[tool.pytest.ini_options]
testpaths = ["tests"]
# Ignore all UserWarning warnings during test runs.
# Filters are single-quoted (TOML literal strings) so that backslashes would be taken verbatim.
filterwarnings = ['ignore::UserWarning']
[build-system]
# Build backend and the package that must be installed to provide it.
build-backend = "poetry.core.masonry.api"
requires = ["poetry-core"]