nsthorat-lilac committed on
Commit
ab92d61
1 Parent(s): e6289f2

Push to HF space

Browse files
Files changed (2) hide show
  1. README.md +1 -0
  2. data/lilac.yml +18 -3
README.md CHANGED
@@ -12,6 +12,7 @@ datasets:
12
  - lilacai/lilac-open-assistant-conversations-2
13
  - lilacai/lilac-lmsys-chat-1m
14
  - lilacai/lilac-OpenOrca
 
15
  - lilacai/lilac-SlimOrca
16
  - lilacai/lilac-UltraChat-200k
17
  - lilacai/lilac-roblox_luau_corpus
 
12
  - lilacai/lilac-open-assistant-conversations-2
13
  - lilacai/lilac-lmsys-chat-1m
14
  - lilacai/lilac-OpenOrca
15
+ - lilacai/lilac-OpenHermes-2.5
16
  - lilacai/lilac-SlimOrca
17
  - lilacai/lilac-UltraChat-200k
18
  - lilacai/lilac-roblox_luau_corpus
data/lilac.yml CHANGED
@@ -110,6 +110,17 @@ datasets:
110
  - response
111
  tags:
112
  - datasets
 
 
 
 
 
 
 
 
 
 
 
113
  - namespace: lilac
114
  name: SlimOrca
115
  source:
@@ -399,9 +410,6 @@ datasets:
399
  tags:
400
  - datasets
401
  use_garden: true
402
- signals:
403
- - signal_name: text_statistics
404
- - signal_name: lang_detection
405
  concept_model_cache_embeddings:
406
  - gte-small
407
  - gte-base
@@ -441,6 +449,13 @@ clusters:
441
  dataset_name: OpenOrca
442
  input_path: !!python/tuple
443
  - question
 
 
 
 
 
 
 
444
  - dataset_namespace: lilac
445
  dataset_name: SlimOrca
446
  input_selector:
 
110
  - response
111
  tags:
112
  - datasets
113
+ - namespace: lilac
114
+ name: OpenHermes-2.5
115
+ source:
116
+ dataset_name: teknium/OpenHermes-2.5
117
+ source_name: huggingface
118
+ settings:
119
+ ui:
120
+ media_paths:
121
+ - - conversations
122
+ - '*'
123
+ - value
124
  - namespace: lilac
125
  name: SlimOrca
126
  source:
 
410
  tags:
411
  - datasets
412
  use_garden: true
 
 
 
413
  concept_model_cache_embeddings:
414
  - gte-small
415
  - gte-base
 
449
  dataset_name: OpenOrca
450
  input_path: !!python/tuple
451
  - question
452
+ - dataset_namespace: lilac
453
+ dataset_name: OpenHermes-2.5
454
+ input_selector:
455
+ format: sharegpt
456
+ selector: human
457
+ output_path: !!python/tuple
458
+ - conversations__clusters
459
  - dataset_namespace: lilac
460
  dataset_name: SlimOrca
461
  input_selector: