forked from mit-han-lab/llm-awq
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathpyproject.toml
31 lines (28 loc) · 848 Bytes
/
pyproject.toml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
# Build requirements: the project is built with setuptools (61.0 or newer)
# through the setuptools.build_meta backend.
[build-system]
requires = [
    "setuptools>=61.0",
]
build-backend = "setuptools.build_meta"
# Distribution metadata for the "awq" package.
[project]
name = "awq"
version = "0.1.0"
description = "An efficient and accurate low-bit weight quantization(INT3/4) method for LLMs."
readme = "README.md"
requires-python = ">=3.8"
classifiers = [
    "Programming Language :: Python :: 3",
    "License :: OSI Approved :: Apache Software License",
]
# Runtime requirements, one PEP 508 string per line, kept in their original
# order. Entries using "==" (transformers, lm_eval, gradio, gradio_client,
# pydantic) are exact version pins; the rest are unpinned or lower-bounded.
dependencies = [
    "accelerate",
    "sentencepiece",
    "tokenizers>=0.12.1",
    "torch>=2.0.0",
    "torchvision",
    "transformers==4.37.2",
    "lm_eval==0.3.0",
    "texttable",
    "toml",
    "attributedict",
    "protobuf",
    "gradio==3.35.2",
    "gradio_client==0.2.9",
    "fastapi",
    "uvicorn",
    "pydantic==2.9.2",
]
# Package discovery: names matching these glob patterns are left out of the
# set of packages setuptools finds.
[tool.setuptools.packages.find]
exclude = [
    "results*",
    "scripts*",
    "examples*",
]
# Same three patterns as the setuptools package-discovery exclude list.
# NOTE(review): it is not visible from this file which tool, if any, reads a
# [tool.wheel] table - confirm before relying on it.
[tool.wheel]
exclude = [
    "results*",
    "scripts*",
    "examples*",
]