hysts HF staff commited on
Commit
e12dd90
·
1 Parent(s): cadad8a
Files changed (3) hide show
  1. README.md +1 -1
  2. app.py +3 -3
  3. requirements.txt +263 -8
README.md CHANGED
@@ -4,7 +4,7 @@ emoji: 🦙
4
  colorFrom: indigo
5
  colorTo: pink
6
  sdk: gradio
7
- sdk_version: 4.39.0
8
  app_file: app.py
9
  pinned: false
10
  license: other
 
4
  colorFrom: indigo
5
  colorTo: pink
6
  sdk: gradio
7
+ sdk_version: 4.44.0
8
  app_file: app.py
9
  pinned: false
10
  license: other
app.py CHANGED
@@ -45,7 +45,7 @@ if torch.cuda.is_available():
45
  @spaces.GPU
46
  def generate(
47
  message: str,
48
- chat_history: list[tuple[str, str]],
49
  system_prompt: str,
50
  max_new_tokens: int = 1024,
51
  temperature: float = 0.6,
@@ -56,8 +56,7 @@ def generate(
56
  conversation = []
57
  if system_prompt:
58
  conversation.append({"role": "system", "content": system_prompt})
59
- for user, assistant in chat_history:
60
- conversation.extend([{"role": "user", "content": user}, {"role": "assistant", "content": assistant}])
61
  conversation.append({"role": "user", "content": message})
62
 
63
  input_ids = tokenizer.apply_chat_template(conversation, return_tensors="pt")
@@ -136,6 +135,7 @@ chat_interface = gr.ChatInterface(
136
  ["Write a 100-word article on 'Benefits of Open-Source in AI research'"],
137
  ],
138
  cache_examples=False,
 
139
  )
140
 
141
  with gr.Blocks(css="style.css", fill_height=True) as demo:
 
45
  @spaces.GPU
46
  def generate(
47
  message: str,
48
+ chat_history: list[dict],
49
  system_prompt: str,
50
  max_new_tokens: int = 1024,
51
  temperature: float = 0.6,
 
56
  conversation = []
57
  if system_prompt:
58
  conversation.append({"role": "system", "content": system_prompt})
59
+ conversation += chat_history
 
60
  conversation.append({"role": "user", "content": message})
61
 
62
  input_ids = tokenizer.apply_chat_template(conversation, return_tensors="pt")
 
135
  ["Write a 100-word article on 'Benefits of Open-Source in AI research'"],
136
  ],
137
  cache_examples=False,
138
+ type="messages",
139
  )
140
 
141
  with gr.Blocks(css="style.css", fill_height=True) as demo:
requirements.txt CHANGED
@@ -1,8 +1,263 @@
1
- accelerate==0.30.1
2
- bitsandbytes==0.43.1
3
- gradio==4.36.1
4
- scipy==1.13.0
5
- sentencepiece==0.2.0
6
- spaces==0.28.3
7
- torch==2.0.0
8
- transformers==4.41.0
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # This file was autogenerated by uv via the following command:
2
+ # uv pip compile pyproject.toml -o requirements.txt
3
+ accelerate==0.34.2
4
+ # via llama-2-13b-chat (pyproject.toml)
5
+ aiofiles==23.2.1
6
+ # via gradio
7
+ annotated-types==0.7.0
8
+ # via pydantic
9
+ anyio==4.6.0
10
+ # via
11
+ # gradio
12
+ # httpx
13
+ # starlette
14
+ bitsandbytes==0.44.0
15
+ # via llama-2-13b-chat (pyproject.toml)
16
+ certifi==2024.8.30
17
+ # via
18
+ # httpcore
19
+ # httpx
20
+ # requests
21
+ charset-normalizer==3.3.2
22
+ # via requests
23
+ click==8.1.7
24
+ # via
25
+ # typer
26
+ # uvicorn
27
+ contourpy==1.3.0
28
+ # via matplotlib
29
+ cycler==0.12.1
30
+ # via matplotlib
31
+ exceptiongroup==1.2.2
32
+ # via anyio
33
+ fastapi==0.115.0
34
+ # via gradio
35
+ ffmpy==0.4.0
36
+ # via gradio
37
+ filelock==3.16.1
38
+ # via
39
+ # huggingface-hub
40
+ # torch
41
+ # transformers
42
+ # triton
43
+ fonttools==4.54.1
44
+ # via matplotlib
45
+ fsspec==2024.9.0
46
+ # via
47
+ # gradio-client
48
+ # huggingface-hub
49
+ # torch
50
+ gradio==4.44.0
51
+ # via
52
+ # llama-2-13b-chat (pyproject.toml)
53
+ # spaces
54
+ gradio-client==1.3.0
55
+ # via gradio
56
+ h11==0.14.0
57
+ # via
58
+ # httpcore
59
+ # uvicorn
60
+ hf-transfer==0.1.8
61
+ # via llama-2-13b-chat (pyproject.toml)
62
+ httpcore==1.0.5
63
+ # via httpx
64
+ httpx==0.27.2
65
+ # via
66
+ # gradio
67
+ # gradio-client
68
+ # spaces
69
+ huggingface-hub==0.25.1
70
+ # via
71
+ # accelerate
72
+ # gradio
73
+ # gradio-client
74
+ # tokenizers
75
+ # transformers
76
+ idna==3.10
77
+ # via
78
+ # anyio
79
+ # httpx
80
+ # requests
81
+ importlib-resources==6.4.5
82
+ # via gradio
83
+ jinja2==3.1.4
84
+ # via
85
+ # gradio
86
+ # torch
87
+ kiwisolver==1.4.7
88
+ # via matplotlib
89
+ markdown-it-py==3.0.0
90
+ # via rich
91
+ markupsafe==2.1.5
92
+ # via
93
+ # gradio
94
+ # jinja2
95
+ matplotlib==3.9.2
96
+ # via gradio
97
+ mdurl==0.1.2
98
+ # via markdown-it-py
99
+ mpmath==1.3.0
100
+ # via sympy
101
+ networkx==3.3
102
+ # via torch
103
+ numpy==2.1.1
104
+ # via
105
+ # accelerate
106
+ # bitsandbytes
107
+ # contourpy
108
+ # gradio
109
+ # matplotlib
110
+ # pandas
111
+ # transformers
112
+ nvidia-cublas-cu12==12.1.3.1
113
+ # via
114
+ # nvidia-cudnn-cu12
115
+ # nvidia-cusolver-cu12
116
+ # torch
117
+ nvidia-cuda-cupti-cu12==12.1.105
118
+ # via torch
119
+ nvidia-cuda-nvrtc-cu12==12.1.105
120
+ # via torch
121
+ nvidia-cuda-runtime-cu12==12.1.105
122
+ # via torch
123
+ nvidia-cudnn-cu12==9.1.0.70
124
+ # via torch
125
+ nvidia-cufft-cu12==11.0.2.54
126
+ # via torch
127
+ nvidia-curand-cu12==10.3.2.106
128
+ # via torch
129
+ nvidia-cusolver-cu12==11.4.5.107
130
+ # via torch
131
+ nvidia-cusparse-cu12==12.1.0.106
132
+ # via
133
+ # nvidia-cusolver-cu12
134
+ # torch
135
+ nvidia-nccl-cu12==2.20.5
136
+ # via torch
137
+ nvidia-nvjitlink-cu12==12.6.68
138
+ # via
139
+ # nvidia-cusolver-cu12
140
+ # nvidia-cusparse-cu12
141
+ nvidia-nvtx-cu12==12.1.105
142
+ # via torch
143
+ orjson==3.10.7
144
+ # via gradio
145
+ packaging==24.1
146
+ # via
147
+ # accelerate
148
+ # gradio
149
+ # gradio-client
150
+ # huggingface-hub
151
+ # matplotlib
152
+ # spaces
153
+ # transformers
154
+ pandas==2.2.3
155
+ # via gradio
156
+ pillow==10.4.0
157
+ # via
158
+ # gradio
159
+ # matplotlib
160
+ psutil==5.9.8
161
+ # via
162
+ # accelerate
163
+ # spaces
164
+ pydantic==2.9.2
165
+ # via
166
+ # fastapi
167
+ # gradio
168
+ # spaces
169
+ pydantic-core==2.23.4
170
+ # via pydantic
171
+ pydub==0.25.1
172
+ # via gradio
173
+ pygments==2.18.0
174
+ # via rich
175
+ pyparsing==3.1.4
176
+ # via matplotlib
177
+ python-dateutil==2.9.0.post0
178
+ # via
179
+ # matplotlib
180
+ # pandas
181
+ python-multipart==0.0.12
182
+ # via gradio
183
+ pytz==2024.2
184
+ # via pandas
185
+ pyyaml==6.0.2
186
+ # via
187
+ # accelerate
188
+ # gradio
189
+ # huggingface-hub
190
+ # transformers
191
+ regex==2024.9.11
192
+ # via transformers
193
+ requests==2.32.3
194
+ # via
195
+ # huggingface-hub
196
+ # spaces
197
+ # transformers
198
+ rich==13.8.1
199
+ # via typer
200
+ ruff==0.6.8
201
+ # via gradio
202
+ safetensors==0.4.5
203
+ # via
204
+ # accelerate
205
+ # transformers
206
+ semantic-version==2.10.0
207
+ # via gradio
208
+ shellingham==1.5.4
209
+ # via typer
210
+ six==1.16.0
211
+ # via python-dateutil
212
+ sniffio==1.3.1
213
+ # via
214
+ # anyio
215
+ # httpx
216
+ spaces==0.30.2
217
+ # via llama-2-13b-chat (pyproject.toml)
218
+ starlette==0.38.6
219
+ # via fastapi
220
+ sympy==1.13.3
221
+ # via torch
222
+ tokenizers==0.20.0
223
+ # via transformers
224
+ tomlkit==0.12.0
225
+ # via gradio
226
+ torch==2.4.0
227
+ # via
228
+ # llama-2-13b-chat (pyproject.toml)
229
+ # accelerate
230
+ # bitsandbytes
231
+ tqdm==4.66.5
232
+ # via
233
+ # huggingface-hub
234
+ # transformers
235
+ transformers==4.45.1
236
+ # via llama-2-13b-chat (pyproject.toml)
237
+ triton==3.0.0
238
+ # via torch
239
+ typer==0.12.5
240
+ # via gradio
241
+ typing-extensions==4.12.2
242
+ # via
243
+ # anyio
244
+ # fastapi
245
+ # gradio
246
+ # gradio-client
247
+ # huggingface-hub
248
+ # pydantic
249
+ # pydantic-core
250
+ # spaces
251
+ # torch
252
+ # typer
253
+ # uvicorn
254
+ tzdata==2024.2
255
+ # via pandas
256
+ urllib3==2.2.3
257
+ # via
258
+ # gradio
259
+ # requests
260
+ uvicorn==0.31.0
261
+ # via gradio
262
+ websockets==12.0
263
+ # via gradio-client