-
Notifications
You must be signed in to change notification settings - Fork 2
/
vllm.yml
151 lines (151 loc) · 3.95 KB
/
vllm.yml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
# Conda environment specification for the "vllm" environment.
#
# Layout:
#   * `dependencies` lists conda packages pinned as name=version=build
#     (linux-64 builds; Python 3.9.19).
#   * The nested `pip:` entry lists PyPI requirements pinned with `==`.
#     These must be nested under the `pip` key; if they sit at the same
#     level as the conda packages, `pip` parses as an empty (null) entry
#     and the PyPI pins are read as conda package specs.
#
# Typical usage (NOTE(review): confirm the file name used in this repo):
#   conda env create -f vllm.yml
name: vllm

channels:
  - defaults

dependencies:
  # Conda-managed base: interpreter, toolchain runtime libs, and pip itself.
  - _libgcc_mutex=0.1=main
  - _openmp_mutex=5.1=1_gnu
  - ca-certificates=2024.3.11=h06a4308_0
  - ld_impl_linux-64=2.38=h1181459_1
  - libffi=3.4.4=h6a678d5_1
  - libgcc-ng=11.2.0=h1234567_1
  - libgomp=11.2.0=h1234567_1
  - libstdcxx-ng=11.2.0=h1234567_1
  - ncurses=6.4=h6a678d5_0
  - openssl=3.0.14=h5eee18b_0
  - pip=24.0=py39h06a4308_0
  - python=3.9.19=h955ad1f_1
  - readline=8.2=h5eee18b_0
  - setuptools=69.5.1=py39h06a4308_0
  - sqlite=3.45.3=h5eee18b_0
  - tk=8.6.14=h39e8969_0
  - wheel=0.43.0=py39h06a4308_0
  - xz=5.4.6=h5eee18b_1
  - zlib=1.2.13=h5eee18b_1
  # PyPI-managed packages, installed by pip after the conda packages above.
  - pip:
      - aiohttp==3.9.5
      - aiosignal==1.3.1
      - annotated-types==0.7.0
      - anyio==4.4.0
      - async-timeout==4.0.3
      - attrs==23.2.0
      - certifi==2024.7.4
      - charset-normalizer==3.3.2
      - click==8.1.7
      - cloudpickle==3.0.0
      - cmake==3.30.0
      - contourpy==1.3.0
      - cycler==0.12.1
      - datasets==2.20.0
      - dill==0.3.8
      - diskcache==5.6.3
      - distro==1.9.0
      - dnspython==2.6.1
      - email-validator==2.2.0
      - exceptiongroup==1.2.1
      - fastapi==0.111.0
      - fastapi-cli==0.0.4
      - filelock==3.15.4
      - fonttools==4.53.1
      - frozenlist==1.4.1
      - fsspec==2024.5.0
      - h11==0.14.0
      - httpcore==1.0.5
      - httptools==0.6.1
      - httpx==0.27.0
      - huggingface-hub==0.23.4
      - idna==3.7
      - importlib-resources==6.4.4
      - interegular==0.3.3
      - jinja2==3.1.4
      - jsonschema==4.23.0
      - jsonschema-specifications==2023.12.1
      - kiwisolver==1.4.5
      - lark==1.1.9
      - llvmlite==0.43.0
      - lm-format-enforcer==0.10.1
      - markdown-it-py==3.0.0
      - markupsafe==2.1.5
      - matplotlib==3.9.2
      - mdurl==0.1.2
      - mpmath==1.3.0
      - msgpack==1.0.8
      - multidict==6.0.5
      - multiprocess==0.70.16
      - nest-asyncio==1.6.0
      - networkx==3.2.1
      - ninja==1.11.1.1
      - numba==0.60.0
      - numpy==1.26.4
      - nvidia-cublas-cu12==12.1.3.1
      - nvidia-cuda-cupti-cu12==12.1.105
      - nvidia-cuda-nvrtc-cu12==12.1.105
      - nvidia-cuda-runtime-cu12==12.1.105
      - nvidia-cudnn-cu12==8.9.2.26
      - nvidia-cufft-cu12==11.0.2.54
      - nvidia-curand-cu12==10.3.2.106
      - nvidia-cusolver-cu12==11.4.5.107
      - nvidia-cusparse-cu12==12.1.0.106
      - nvidia-ml-py==12.555.43
      - nvidia-nccl-cu12==2.20.5
      - nvidia-nvjitlink-cu12==12.5.82
      - nvidia-nvtx-cu12==12.1.105
      - openai==1.35.13
      - orjson==3.10.6
      - outlines==0.0.46
      - packaging==24.1
      - pandas==2.2.2
      - pillow==10.4.0
      - prometheus-client==0.20.0
      - prometheus-fastapi-instrumentator==7.0.0
      - protobuf==5.27.2
      - psutil==6.0.0
      - py-cpuinfo==9.0.0
      - pyairports==2.1.1
      - pyarrow==16.1.0
      - pyarrow-hotfix==0.6
      - pycountry==24.6.1
      - pydantic==2.8.2
      - pydantic-core==2.20.1
      - pygments==2.18.0
      - pyparsing==3.1.4
      - python-dateutil==2.9.0.post0
      - python-dotenv==1.0.1
      - python-multipart==0.0.9
      - pytz==2024.1
      - pyyaml==6.0.1
      - ray==2.32.0
      - referencing==0.35.1
      - regex==2024.5.15
      - requests==2.32.3
      - rich==13.7.1
      - rpds-py==0.19.0
      - safetensors==0.4.3
      - seaborn==0.13.2
      - sentencepiece==0.2.0
      - shellingham==1.5.4
      - six==1.16.0
      - sniffio==1.3.1
      - starlette==0.37.2
      - sympy==1.13.0
      - tiktoken==0.7.0
      - tokenizers==0.19.1
      - torch==2.3.0
      - torchvision==0.18.0
      - tqdm==4.66.4
      - transformers==4.42.4
      - triton==2.3.0
      - typer==0.12.3
      - typing-extensions==4.12.2
      - tzdata==2024.1
      - ujson==5.10.0
      - urllib3==2.2.2
      - uvicorn==0.30.1
      - uvloop==0.19.0
      - vllm==0.5.1
      - vllm-flash-attn==2.5.9
      - watchfiles==0.22.0
      - websockets==12.0
      - xformers==0.0.26.post1
      - xxhash==3.4.1
      - yarl==1.9.4
      - zipp==3.20.1