nsthorat-lilac committed on
Commit
9e82f79
1 Parent(s): 0c01f44

Push to HF space

Browse files
Files changed (2) hide show
  1. README.md +4 -2
  2. data/lilac.yml +73 -32
README.md CHANGED
@@ -11,9 +11,11 @@ datasets:
11
  - lilacai/lilac-glaive-function-calling-v2
12
  - lilacai/lilac-open-assistant-conversations-2
13
  - lilacai/lilac-lmsys-chat-1m
14
- - lilacai/lilac-databricks-dolly-15k-curated-en
15
  - lilacai/lilac-OpenOrca
 
 
 
 
16
  - lilacai/lilac-dolphin
17
- - lilacai/lilac-mosaic-instruct-v3
18
 
19
  ---
 
11
  - lilacai/lilac-glaive-function-calling-v2
12
  - lilacai/lilac-open-assistant-conversations-2
13
  - lilacai/lilac-lmsys-chat-1m
 
14
  - lilacai/lilac-OpenOrca
15
+ - lilacai/lilac-MMLU
16
+ - lilacai/lilac-ARC-Easy
17
+ - lilacai/lilac-ARC-Challenge
18
+ - lilacai/lilac-databricks-dolly-15k-curated-en
19
  - lilacai/lilac-dolphin
 
20
 
21
  ---
data/lilac.yml CHANGED
@@ -98,6 +98,67 @@ datasets:
98
  - content
99
  tags:
100
  - logs
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
101
  - namespace: lilac
102
  name: databricks-dolly-15k-curated-en
103
  source:
@@ -127,21 +188,6 @@ datasets:
127
  - '*'
128
  tags:
129
  - machine-learning
130
- - namespace: lilac
131
- name: OpenOrca
132
- source:
133
- dataset_name: Open-Orca/OpenOrca
134
- source_name: huggingface
135
- embeddings:
136
- - path: question
137
- embedding: gte-small
138
- settings:
139
- ui:
140
- media_paths:
141
- - question
142
- - response
143
- tags:
144
- - datasets
145
  - namespace: lilac
146
  name: dolphin
147
  tags:
@@ -159,19 +205,6 @@ datasets:
159
  - - input__cluster
160
  - text
161
  markdown_paths: []
162
- - namespace: lilac
163
- name: mosaic-instruct-v3
164
- tags:
165
- - datasets
166
- source:
167
- dataset_name: mosaicml/instruct-v3
168
- source_name: huggingface
169
- settings:
170
- ui:
171
- media_paths:
172
- - prompt
173
- - response
174
- markdown_paths: []
175
  use_garden: true
176
  signals:
177
  - signal_name: text_statistics
@@ -220,10 +253,18 @@ clusters:
220
  input_path: !!python/tuple
221
  - original-instruction
222
  - dataset_namespace: lilac
223
- dataset_name: dolphin
224
  input_path: !!python/tuple
225
- - input
 
 
 
 
226
  - dataset_namespace: lilac
227
- dataset_name: mosaic-instruct-v3
228
  input_path: !!python/tuple
229
- - prompt
 
 
 
 
 
98
  - content
99
  tags:
100
  - logs
101
+ - namespace: lilac
102
+ name: OpenOrca
103
+ source:
104
+ dataset_name: Open-Orca/OpenOrca
105
+ source_name: huggingface
106
+ embeddings:
107
+ - path: question
108
+ embedding: gte-small
109
+ settings:
110
+ ui:
111
+ media_paths:
112
+ - question
113
+ - response
114
+ tags:
115
+ - datasets
116
+ - namespace: lilac
117
+ name: MMLU
118
+ source:
119
+ dataset_name: cais/mmlu
120
+ config_name: all
121
+ source_name: huggingface
122
+ settings:
123
+ ui:
124
+ media_paths:
125
+ - question
126
+ - - choices
127
+ - '*'
128
+ - answer
129
+ markdown_paths: []
130
+ tags:
131
+ - eval
132
+ - namespace: lilac
133
+ name: ARC-Easy
134
+ source:
135
+ dataset_name: allenai/ai2_arc
136
+ config_name: ARC-Easy
137
+ source_name: huggingface
138
+ settings:
139
+ ui:
140
+ media_paths:
141
+ - question
142
+ - - choices
143
+ - text
144
+ - '*'
145
+ - answerKey
146
+ markdown_paths: []
147
+ - namespace: lilac
148
+ name: ARC-Challenge
149
+ source:
150
+ dataset_name: allenai/ai2_arc
151
+ config_name: ARC-Challenge
152
+ source_name: huggingface
153
+ settings:
154
+ ui:
155
+ media_paths:
156
+ - question
157
+ - - choices
158
+ - text
159
+ - '*'
160
+ - answerKey
161
+ markdown_paths: []
162
  - namespace: lilac
163
  name: databricks-dolly-15k-curated-en
164
  source:
 
188
  - '*'
189
  tags:
190
  - machine-learning
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
191
  - namespace: lilac
192
  name: dolphin
193
  tags:
 
205
  - - input__cluster
206
  - text
207
  markdown_paths: []
 
 
 
 
 
 
 
 
 
 
 
 
 
208
  use_garden: true
209
  signals:
210
  - signal_name: text_statistics
 
253
  input_path: !!python/tuple
254
  - original-instruction
255
  - dataset_namespace: lilac
256
+ dataset_name: MMLU
257
  input_path: !!python/tuple
258
+ - question
259
+ - dataset_namespace: lilac
260
+ dataset_name: ARC-Easy
261
+ input_path: !!python/tuple
262
+ - question
263
  - dataset_namespace: lilac
264
+ dataset_name: ARC-Challenge
265
  input_path: !!python/tuple
266
+ - question
267
+ - dataset_namespace: lilac
268
+ dataset_name: dolphin
269
+ input_path: !!python/tuple
270
+ - input