nsthorat committed on
Commit
b1494e2
1 Parent(s): f1ca8ba
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. .gitattributes +0 -21
  2. data/.cache/lilac/concept/lilac/legal-termination/cohere.pkl +0 -0
  3. data/.cache/lilac/concept/lilac/legal-termination/gte-base.pkl +0 -0
  4. data/.cache/lilac/concept/lilac/legal-termination/gte-small.pkl +0 -0
  5. data/.cache/lilac/concept/lilac/legal-termination/openai.pkl +0 -0
  6. data/.cache/lilac/concept/lilac/legal-termination/palm.pkl +0 -0
  7. data/.cache/lilac/concept/lilac/legal-termination/sbert.pkl +0 -0
  8. data/.cache/lilac/concept/lilac/negative-sentiment/cohere.pkl +0 -3
  9. data/.cache/lilac/concept/lilac/negative-sentiment/gte-base.pkl +0 -0
  10. data/.cache/lilac/concept/lilac/negative-sentiment/gte-small.pkl +0 -0
  11. data/.cache/lilac/concept/lilac/negative-sentiment/openai.pkl +0 -0
  12. data/.cache/lilac/concept/lilac/negative-sentiment/palm.pkl +0 -0
  13. data/.cache/lilac/concept/lilac/negative-sentiment/sbert.pkl +0 -0
  14. data/.cache/lilac/concept/lilac/non-english/cohere.pkl +0 -3
  15. data/.cache/lilac/concept/lilac/non-english/gte-base.pkl +0 -0
  16. data/.cache/lilac/concept/lilac/non-english/gte-small.pkl +0 -0
  17. data/.cache/lilac/concept/lilac/non-english/openai.pkl +0 -3
  18. data/.cache/lilac/concept/lilac/non-english/palm.pkl +0 -0
  19. data/.cache/lilac/concept/lilac/non-english/sbert.pkl +0 -0
  20. data/.cache/lilac/concept/lilac/positive-sentiment/cohere.pkl +0 -3
  21. data/.cache/lilac/concept/lilac/positive-sentiment/gte-base.pkl +0 -0
  22. data/.cache/lilac/concept/lilac/positive-sentiment/gte-small.pkl +0 -0
  23. data/.cache/lilac/concept/lilac/positive-sentiment/openai.pkl +0 -0
  24. data/.cache/lilac/concept/lilac/positive-sentiment/palm.pkl +0 -0
  25. data/.cache/lilac/concept/lilac/positive-sentiment/sbert.pkl +0 -0
  26. data/.cache/lilac/concept/lilac/profanity/cohere.pkl +0 -3
  27. data/.cache/lilac/concept/lilac/profanity/gte-base.pkl +0 -3
  28. data/.cache/lilac/concept/lilac/profanity/gte-small.pkl +0 -3
  29. data/.cache/lilac/concept/lilac/profanity/openai.pkl +0 -3
  30. data/.cache/lilac/concept/lilac/profanity/palm.pkl +0 -3
  31. data/.cache/lilac/concept/lilac/profanity/sbert.pkl +0 -3
  32. data/.cache/lilac/concept/lilac/question/cohere.pkl +0 -3
  33. data/.cache/lilac/concept/lilac/question/gte-base.pkl +0 -3
  34. data/.cache/lilac/concept/lilac/question/gte-small.pkl +0 -0
  35. data/.cache/lilac/concept/lilac/question/openai.pkl +0 -3
  36. data/.cache/lilac/concept/lilac/question/palm.pkl +0 -3
  37. data/.cache/lilac/concept/lilac/question/sbert.pkl +0 -0
  38. data/.cache/lilac/concept/lilac/source-code/cohere.pkl +0 -3
  39. data/.cache/lilac/concept/lilac/source-code/gte-base.pkl +0 -0
  40. data/.cache/lilac/concept/lilac/source-code/gte-small.pkl +0 -0
  41. data/.cache/lilac/concept/lilac/source-code/openai.pkl +0 -0
  42. data/.cache/lilac/concept/lilac/source-code/palm.pkl +0 -0
  43. data/.cache/lilac/concept/lilac/source-code/sbert.pkl +0 -0
  44. data/.cache/lilac/concept/lilac/toxicity/cohere.pkl +0 -3
  45. data/.cache/lilac/concept/lilac/toxicity/gte-base.pkl +0 -3
  46. data/.cache/lilac/concept/lilac/toxicity/gte-small.pkl +0 -3
  47. data/.cache/lilac/concept/lilac/toxicity/openai.pkl +0 -3
  48. data/.cache/lilac/concept/lilac/toxicity/palm.pkl +0 -3
  49. data/.cache/lilac/concept/lilac/toxicity/sbert.pkl +0 -3
  50. data/lilac.yml +1969 -0
.gitattributes DELETED
@@ -1,21 +0,0 @@
1
- data/.cache/lilac/concept/lilac/negative-sentiment/cohere.pkl filter=lfs diff=lfs merge=lfs -text
2
- data/.cache/lilac/concept/lilac/non-english/cohere.pkl filter=lfs diff=lfs merge=lfs -text
3
- data/.cache/lilac/concept/lilac/non-english/openai.pkl filter=lfs diff=lfs merge=lfs -text
4
- data/.cache/lilac/concept/lilac/positive-sentiment/cohere.pkl filter=lfs diff=lfs merge=lfs -text
5
- data/.cache/lilac/concept/lilac/profanity/cohere.pkl filter=lfs diff=lfs merge=lfs -text
6
- data/.cache/lilac/concept/lilac/profanity/gte-base.pkl filter=lfs diff=lfs merge=lfs -text
7
- data/.cache/lilac/concept/lilac/profanity/gte-small.pkl filter=lfs diff=lfs merge=lfs -text
8
- data/.cache/lilac/concept/lilac/profanity/openai.pkl filter=lfs diff=lfs merge=lfs -text
9
- data/.cache/lilac/concept/lilac/profanity/palm.pkl filter=lfs diff=lfs merge=lfs -text
10
- data/.cache/lilac/concept/lilac/profanity/sbert.pkl filter=lfs diff=lfs merge=lfs -text
11
- data/.cache/lilac/concept/lilac/question/cohere.pkl filter=lfs diff=lfs merge=lfs -text
12
- data/.cache/lilac/concept/lilac/question/gte-base.pkl filter=lfs diff=lfs merge=lfs -text
13
- data/.cache/lilac/concept/lilac/question/openai.pkl filter=lfs diff=lfs merge=lfs -text
14
- data/.cache/lilac/concept/lilac/question/palm.pkl filter=lfs diff=lfs merge=lfs -text
15
- data/.cache/lilac/concept/lilac/source-code/cohere.pkl filter=lfs diff=lfs merge=lfs -text
16
- data/.cache/lilac/concept/lilac/toxicity/cohere.pkl filter=lfs diff=lfs merge=lfs -text
17
- data/.cache/lilac/concept/lilac/toxicity/gte-base.pkl filter=lfs diff=lfs merge=lfs -text
18
- data/.cache/lilac/concept/lilac/toxicity/gte-small.pkl filter=lfs diff=lfs merge=lfs -text
19
- data/.cache/lilac/concept/lilac/toxicity/openai.pkl filter=lfs diff=lfs merge=lfs -text
20
- data/.cache/lilac/concept/lilac/toxicity/palm.pkl filter=lfs diff=lfs merge=lfs -text
21
- data/.cache/lilac/concept/lilac/toxicity/sbert.pkl filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
data/.cache/lilac/concept/lilac/legal-termination/cohere.pkl DELETED
Binary file (610 kB)
 
data/.cache/lilac/concept/lilac/legal-termination/gte-base.pkl DELETED
Binary file (117 kB)
 
data/.cache/lilac/concept/lilac/legal-termination/gte-small.pkl DELETED
Binary file (60.6 kB)
 
data/.cache/lilac/concept/lilac/legal-termination/openai.pkl DELETED
Binary file (231 kB)
 
data/.cache/lilac/concept/lilac/legal-termination/palm.pkl DELETED
Binary file (117 kB)
 
data/.cache/lilac/concept/lilac/legal-termination/sbert.pkl DELETED
Binary file (60.6 kB)
 
data/.cache/lilac/concept/lilac/negative-sentiment/cohere.pkl DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:13bcab9d52ff84f47fe4311d1bbde68efde777a5f3e99bd843ecf69895a4f6a3
3
- size 2088021
 
 
 
 
data/.cache/lilac/concept/lilac/negative-sentiment/gte-base.pkl DELETED
Binary file (397 kB)
 
data/.cache/lilac/concept/lilac/negative-sentiment/gte-small.pkl DELETED
Binary file (202 kB)
 
data/.cache/lilac/concept/lilac/negative-sentiment/openai.pkl DELETED
Binary file (787 kB)
 
data/.cache/lilac/concept/lilac/negative-sentiment/palm.pkl DELETED
Binary file (397 kB)
 
data/.cache/lilac/concept/lilac/negative-sentiment/sbert.pkl DELETED
Binary file (202 kB)
 
data/.cache/lilac/concept/lilac/non-english/cohere.pkl DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:8073ad4261c03aac8350bcee76a40669df0a529b89b605e4a991189c7ad549ed
3
- size 3374534
 
 
 
 
data/.cache/lilac/concept/lilac/non-english/gte-base.pkl DELETED
Binary file (645 kB)
 
data/.cache/lilac/concept/lilac/non-english/gte-small.pkl DELETED
Binary file (330 kB)
 
data/.cache/lilac/concept/lilac/non-english/openai.pkl DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:3c924d11c7e0b61a76dfcafd4bd1cbf4f80afab97a5e537c0fb7ebb18db25a5d
3
- size 1275037
 
 
 
 
data/.cache/lilac/concept/lilac/non-english/palm.pkl DELETED
Binary file (645 kB)
 
data/.cache/lilac/concept/lilac/non-english/sbert.pkl DELETED
Binary file (330 kB)
 
data/.cache/lilac/concept/lilac/positive-sentiment/cohere.pkl DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:fc23e270e1824e258a51ea5419de53e74b6cc23fa31ff586b6c2f0f0f7549b91
3
- size 1857652
 
 
 
 
data/.cache/lilac/concept/lilac/positive-sentiment/gte-base.pkl DELETED
Binary file (353 kB)
 
data/.cache/lilac/concept/lilac/positive-sentiment/gte-small.pkl DELETED
Binary file (180 kB)
 
data/.cache/lilac/concept/lilac/positive-sentiment/openai.pkl DELETED
Binary file (700 kB)
 
data/.cache/lilac/concept/lilac/positive-sentiment/palm.pkl DELETED
Binary file (353 kB)
 
data/.cache/lilac/concept/lilac/positive-sentiment/sbert.pkl DELETED
Binary file (180 kB)
 
data/.cache/lilac/concept/lilac/profanity/cohere.pkl DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:f6c694a83f498be11182ea462dba84e93970c502f687504f5b684a47f175c411
3
- size 17413997
 
 
 
 
data/.cache/lilac/concept/lilac/profanity/gte-base.pkl DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:3287d4d06a78e0757f0b8586651e24fc7ac8f9d742a0091b24dd5bfc3b4c441f
3
- size 3301326
 
 
 
 
data/.cache/lilac/concept/lilac/profanity/gte-small.pkl DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:6f25837df92c799823a7ea284d3046d10fd2d146e97610d739fd088a44172e57
3
- size 1672960
 
 
 
 
data/.cache/lilac/concept/lilac/profanity/openai.pkl DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:6c199a5348b201c91db1926c12c47ec370b69badde06981d18dead800210acc2
3
- size 6558076
 
 
 
 
data/.cache/lilac/concept/lilac/profanity/palm.pkl DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:17cbb10cf538ab7e823d4db1fddf81977a155e3270a986b182370297e5a48380
3
- size 3301322
 
 
 
 
data/.cache/lilac/concept/lilac/profanity/sbert.pkl DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:132800020bbe32723942388c651eac45ae9da9aa98e7bfdd46b3f5820e02a339
3
- size 1672951
 
 
 
 
data/.cache/lilac/concept/lilac/question/cohere.pkl DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:f2ce2b4f9bf3dba7d6afa146aad9b443d35987b230366b668fbf15325b27fcf8
3
- size 6254200
 
 
 
 
data/.cache/lilac/concept/lilac/question/gte-base.pkl DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:fd6e9243c20ec84229419814178411b7f6f80a6d8e2f9e244fcc4f752d6ec5f0
3
- size 1194951
 
 
 
 
data/.cache/lilac/concept/lilac/question/gte-small.pkl DELETED
Binary file (611 kB)
 
data/.cache/lilac/concept/lilac/question/openai.pkl DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:b998b1370a2982689e6c5e0f099659f103130a52090f0f9f2b234abdc3c8d2b0
3
- size 2362458
 
 
 
 
data/.cache/lilac/concept/lilac/question/palm.pkl DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:98e077a03707541da691311fd28d9bed00ec9fb2a22a915adde2bc436f6362e6
3
- size 1194947
 
 
 
 
data/.cache/lilac/concept/lilac/question/sbert.pkl DELETED
Binary file (611 kB)
 
data/.cache/lilac/concept/lilac/source-code/cohere.pkl DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:ad4234a60f17ac8a068c3b407af1b63fd460800c9fd6c014da70d8eb3b0c0939
3
- size 1284715
 
 
 
 
data/.cache/lilac/concept/lilac/source-code/gte-base.pkl DELETED
Binary file (246 kB)
 
data/.cache/lilac/concept/lilac/source-code/gte-small.pkl DELETED
Binary file (126 kB)
 
data/.cache/lilac/concept/lilac/source-code/openai.pkl DELETED
Binary file (486 kB)
 
data/.cache/lilac/concept/lilac/source-code/palm.pkl DELETED
Binary file (246 kB)
 
data/.cache/lilac/concept/lilac/source-code/sbert.pkl DELETED
Binary file (126 kB)
 
data/.cache/lilac/concept/lilac/toxicity/cohere.pkl DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:cc3d3f95d84b64657ec4697ce899aee940d62725e0fb88c9f8b38f03298d89b3
3
- size 19602537
 
 
 
 
data/.cache/lilac/concept/lilac/toxicity/gte-base.pkl DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:0e9363d2faacb10fe0528f06df2237a44f9b1686f4100d3cca2cdb1a621a90c2
3
- size 3719127
 
 
 
 
data/.cache/lilac/concept/lilac/toxicity/gte-small.pkl DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:b094a716fcbda3cd5b686457bf2510c0a17cabddac21d88d8c97f6a6908266ec
3
- size 1886446
 
 
 
 
data/.cache/lilac/concept/lilac/toxicity/openai.pkl DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:08ee50c3a7679c15e442d12996ddac07bd9ffb8de30f8a607f6b4dd72e7f0343
3
- size 7384512
 
 
 
 
data/.cache/lilac/concept/lilac/toxicity/palm.pkl DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:e9d54189781c5a3e56f8640a7ed3516c82a411b09798e7dca84c6ba0f7efe48d
3
- size 3719128
 
 
 
 
data/.cache/lilac/concept/lilac/toxicity/sbert.pkl DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:654c96a6ef52b60a0f81d099c8bf4cda9957dde8d9aaea43f21cddc6c54c1ab5
3
- size 1886440
 
 
 
 
data/lilac.yml ADDED
@@ -0,0 +1,1969 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Lilac project config.
2
+ # See https://lilacml.com/api_reference/index.html#lilac.Config for details.
3
+
4
+ datasets:
5
+ - namespace: lilac
6
+ name: imdb
7
+ source:
8
+ dataset_name: imdb
9
+ source_name: huggingface
10
+ embeddings:
11
+ - path: text
12
+ embedding: gte-small
13
+ signals:
14
+ - path: text
15
+ signal:
16
+ signal_name: near_dup
17
+ - path: text
18
+ signal:
19
+ signal_name: pii
20
+ - path: text
21
+ signal:
22
+ signal_name: lang_detection
23
+ - path: text
24
+ signal:
25
+ embedding: gte-small
26
+ namespace: lilac
27
+ concept_name: positive-sentiment
28
+ signal_name: concept_score
29
+ - path: text
30
+ signal:
31
+ embedding: gte-small
32
+ namespace: lilac
33
+ concept_name: non-english
34
+ signal_name: concept_score
35
+ - path: text
36
+ signal:
37
+ embedding: gte-small
38
+ namespace: lilac
39
+ concept_name: toxicity
40
+ signal_name: concept_score
41
+ - path: text
42
+ signal:
43
+ embedding: gte-small
44
+ namespace: lilac
45
+ concept_name: question
46
+ signal_name: concept_score
47
+ - path: text
48
+ signal:
49
+ embedding: gte-small
50
+ namespace: lilac
51
+ concept_name: legal-termination
52
+ signal_name: concept_score
53
+ - path: text
54
+ signal:
55
+ embedding: gte-small
56
+ namespace: lilac
57
+ concept_name: source-code
58
+ signal_name: concept_score
59
+ - path: text
60
+ signal:
61
+ embedding: gte-small
62
+ namespace: lilac
63
+ concept_name: negative-sentiment
64
+ signal_name: concept_score
65
+ - path: text
66
+ signal:
67
+ embedding: gte-small
68
+ namespace: lilac
69
+ concept_name: profanity
70
+ signal_name: concept_score
71
+ - path: text
72
+ signal:
73
+ signal_name: text_statistics
74
+ settings:
75
+ ui:
76
+ media_paths:
77
+ - text
78
+ preferred_embedding: gte-small
79
+ - namespace: lilac
80
+ name: open-asssistant-conversations
81
+ source:
82
+ dataset_name: OpenAssistant/oasst1
83
+ source_name: huggingface
84
+ embeddings:
85
+ - path: text
86
+ embedding: gte-small
87
+ signals:
88
+ - path: text
89
+ signal:
90
+ signal_name: near_dup
91
+ - path: text
92
+ signal:
93
+ signal_name: pii
94
+ - path: text
95
+ signal:
96
+ signal_name: lang_detection
97
+ - path: text
98
+ signal:
99
+ embedding: gte-small
100
+ namespace: lilac
101
+ concept_name: positive-sentiment
102
+ signal_name: concept_score
103
+ - path: text
104
+ signal:
105
+ embedding: gte-small
106
+ namespace: lilac
107
+ concept_name: non-english
108
+ signal_name: concept_score
109
+ - path: text
110
+ signal:
111
+ embedding: gte-small
112
+ namespace: lilac
113
+ concept_name: toxicity
114
+ signal_name: concept_score
115
+ - path: text
116
+ signal:
117
+ embedding: gte-small
118
+ namespace: lilac
119
+ concept_name: question
120
+ signal_name: concept_score
121
+ - path: text
122
+ signal:
123
+ embedding: gte-small
124
+ namespace: lilac
125
+ concept_name: legal-termination
126
+ signal_name: concept_score
127
+ - path: text
128
+ signal:
129
+ embedding: gte-small
130
+ namespace: lilac
131
+ concept_name: source-code
132
+ signal_name: concept_score
133
+ - path: text
134
+ signal:
135
+ embedding: gte-small
136
+ namespace: lilac
137
+ concept_name: negative-sentiment
138
+ signal_name: concept_score
139
+ - path: text
140
+ signal:
141
+ embedding: gte-small
142
+ namespace: lilac
143
+ concept_name: negative-sentiment
144
+ signal_name: concept_score
145
+ - path: text
146
+ signal:
147
+ embedding: gte-small
148
+ namespace: lilac
149
+ concept_name: profanity
150
+ signal_name: concept_score
151
+ - path: text
152
+ signal:
153
+ signal_name: text_statistics
154
+ settings:
155
+ ui:
156
+ media_paths:
157
+ - text
158
+ preferred_embedding: gte-small
159
+ - namespace: lilac
160
+ name: wikitext-2-raw-v1
161
+ source:
162
+ dataset_name: wikitext
163
+ config_name: wikitext-2-raw-v1
164
+ source_name: huggingface
165
+ embeddings:
166
+ - path: text
167
+ embedding: gte-small
168
+ signals:
169
+ - path: text
170
+ signal:
171
+ signal_name: near_dup
172
+ - path: text
173
+ signal:
174
+ signal_name: pii
175
+ - path: text
176
+ signal:
177
+ signal_name: lang_detection
178
+ - path: text
179
+ signal:
180
+ signal_name: text_statistics
181
+ - path: text
182
+ signal:
183
+ embedding: gte-small
184
+ namespace: lilac
185
+ concept_name: legal-termination
186
+ signal_name: concept_score
187
+ - path: text
188
+ signal:
189
+ embedding: gte-small
190
+ namespace: lilac
191
+ concept_name: negative-sentiment
192
+ signal_name: concept_score
193
+ - path: text
194
+ signal:
195
+ embedding: gte-small
196
+ namespace: lilac
197
+ concept_name: non-english
198
+ signal_name: concept_score
199
+ - path: text
200
+ signal:
201
+ embedding: gte-small
202
+ namespace: lilac
203
+ concept_name: positive-sentiment
204
+ signal_name: concept_score
205
+ - path: text
206
+ signal:
207
+ embedding: gte-small
208
+ namespace: lilac
209
+ concept_name: profanity
210
+ signal_name: concept_score
211
+ - path: text
212
+ signal:
213
+ embedding: gte-small
214
+ namespace: lilac
215
+ concept_name: question
216
+ signal_name: concept_score
217
+ - path: text
218
+ signal:
219
+ embedding: gte-small
220
+ namespace: lilac
221
+ concept_name: source-code
222
+ signal_name: concept_score
223
+ - path: text
224
+ signal:
225
+ embedding: gte-small
226
+ namespace: lilac
227
+ concept_name: toxicity
228
+ signal_name: concept_score
229
+ settings:
230
+ ui:
231
+ media_paths:
232
+ - text
233
+ preferred_embedding: gte-small
234
+ - namespace: lilac
235
+ name: squad_v2
236
+ source:
237
+ dataset_name: squad_v2
238
+ source_name: huggingface
239
+ embeddings:
240
+ - path: context
241
+ embedding: gte-small
242
+ signals:
243
+ - path: context
244
+ signal:
245
+ signal_name: near_dup
246
+ - path: context
247
+ signal:
248
+ signal_name: pii
249
+ - path: context
250
+ signal:
251
+ signal_name: lang_detection
252
+ - path: context
253
+ signal:
254
+ embedding: gte-small
255
+ namespace: lilac
256
+ concept_name: positive-sentiment
257
+ signal_name: concept_score
258
+ - path: context
259
+ signal:
260
+ embedding: gte-small
261
+ namespace: lilac
262
+ concept_name: non-english
263
+ signal_name: concept_score
264
+ - path: context
265
+ signal:
266
+ embedding: gte-small
267
+ namespace: lilac
268
+ concept_name: toxicity
269
+ signal_name: concept_score
270
+ - path: context
271
+ signal:
272
+ embedding: gte-small
273
+ namespace: lilac
274
+ concept_name: question
275
+ signal_name: concept_score
276
+ - path: context
277
+ signal:
278
+ embedding: gte-small
279
+ namespace: lilac
280
+ concept_name: legal-termination
281
+ signal_name: concept_score
282
+ - path: context
283
+ signal:
284
+ embedding: gte-small
285
+ namespace: lilac
286
+ concept_name: source-code
287
+ signal_name: concept_score
288
+ - path: context
289
+ signal:
290
+ embedding: gte-small
291
+ namespace: lilac
292
+ concept_name: negative-sentiment
293
+ signal_name: concept_score
294
+ - path: context
295
+ signal:
296
+ embedding: gte-small
297
+ namespace: lilac
298
+ concept_name: profanity
299
+ signal_name: concept_score
300
+ - path: context
301
+ signal:
302
+ signal_name: text_statistics
303
+ - path: question
304
+ signal:
305
+ signal_name: near_dup
306
+ - path: question
307
+ signal:
308
+ signal_name: pii
309
+ - path: question
310
+ signal:
311
+ signal_name: lang_detection
312
+ - path: question
313
+ signal:
314
+ signal_name: text_statistics
315
+ - path:
316
+ - answers
317
+ - text
318
+ - '*'
319
+ signal:
320
+ signal_name: near_dup
321
+ - path:
322
+ - answers
323
+ - text
324
+ - '*'
325
+ signal:
326
+ signal_name: pii
327
+ - path:
328
+ - answers
329
+ - text
330
+ - '*'
331
+ signal:
332
+ signal_name: lang_detection
333
+ - path:
334
+ - answers
335
+ - text
336
+ - '*'
337
+ signal:
338
+ signal_name: text_statistics
339
+ - path: question
340
+ signal:
341
+ embedding: gte-small
342
+ namespace: lilac
343
+ concept_name: legal-termination
344
+ signal_name: concept_score
345
+ - path: question
346
+ signal:
347
+ embedding: gte-small
348
+ namespace: lilac
349
+ concept_name: negative-sentiment
350
+ signal_name: concept_score
351
+ - path: question
352
+ signal:
353
+ embedding: gte-small
354
+ namespace: lilac
355
+ concept_name: non-english
356
+ signal_name: concept_score
357
+ - path: question
358
+ signal:
359
+ embedding: gte-small
360
+ namespace: lilac
361
+ concept_name: positive-sentiment
362
+ signal_name: concept_score
363
+ - path: question
364
+ signal:
365
+ embedding: gte-small
366
+ namespace: lilac
367
+ concept_name: profanity
368
+ signal_name: concept_score
369
+ - path: question
370
+ signal:
371
+ embedding: gte-small
372
+ namespace: lilac
373
+ concept_name: question
374
+ signal_name: concept_score
375
+ - path: question
376
+ signal:
377
+ embedding: gte-small
378
+ namespace: lilac
379
+ concept_name: source-code
380
+ signal_name: concept_score
381
+ - path: question
382
+ signal:
383
+ embedding: gte-small
384
+ namespace: lilac
385
+ concept_name: toxicity
386
+ signal_name: concept_score
387
+ - path:
388
+ - answers
389
+ - text
390
+ - '*'
391
+ signal:
392
+ embedding: gte-small
393
+ namespace: lilac
394
+ concept_name: legal-termination
395
+ signal_name: concept_score
396
+ - path:
397
+ - answers
398
+ - text
399
+ - '*'
400
+ signal:
401
+ embedding: gte-small
402
+ namespace: lilac
403
+ concept_name: negative-sentiment
404
+ signal_name: concept_score
405
+ - path:
406
+ - answers
407
+ - text
408
+ - '*'
409
+ signal:
410
+ embedding: gte-small
411
+ namespace: lilac
412
+ concept_name: non-english
413
+ signal_name: concept_score
414
+ - path:
415
+ - answers
416
+ - text
417
+ - '*'
418
+ signal:
419
+ embedding: gte-small
420
+ namespace: lilac
421
+ concept_name: positive-sentiment
422
+ signal_name: concept_score
423
+ - path:
424
+ - answers
425
+ - text
426
+ - '*'
427
+ signal:
428
+ embedding: gte-small
429
+ namespace: lilac
430
+ concept_name: profanity
431
+ signal_name: concept_score
432
+ - path:
433
+ - answers
434
+ - text
435
+ - '*'
436
+ signal:
437
+ embedding: gte-small
438
+ namespace: lilac
439
+ concept_name: question
440
+ signal_name: concept_score
441
+ - path:
442
+ - answers
443
+ - text
444
+ - '*'
445
+ signal:
446
+ embedding: gte-small
447
+ namespace: lilac
448
+ concept_name: source-code
449
+ signal_name: concept_score
450
+ - path:
451
+ - answers
452
+ - text
453
+ - '*'
454
+ signal:
455
+ embedding: gte-small
456
+ namespace: lilac
457
+ concept_name: toxicity
458
+ signal_name: concept_score
459
+ settings:
460
+ ui:
461
+ media_paths:
462
+ - context
463
+ - question
464
+ - - answers
465
+ - text
466
+ - '*'
467
+ preferred_embedding: gte-small
468
+ - namespace: lilac
469
+ name: databricks-dolly-15k-curated-en
470
+ source:
471
+ dataset_name: argilla/databricks-dolly-15k-curated-en
472
+ source_name: huggingface
473
+ embeddings:
474
+ - path: original-context
475
+ embedding: gte-small
476
+ - path:
477
+ - new-context
478
+ - value
479
+ - '*'
480
+ embedding: gte-small
481
+ signals:
482
+ - path: original-instruction
483
+ signal:
484
+ signal_name: near_dup
485
+ - path: original-instruction
486
+ signal:
487
+ signal_name: pii
488
+ - path: original-instruction
489
+ signal:
490
+ signal_name: lang_detection
491
+ - path: original-instruction
492
+ signal:
493
+ signal_name: text_statistics
494
+ - path: original-context
495
+ signal:
496
+ signal_name: near_dup
497
+ - path: original-context
498
+ signal:
499
+ signal_name: pii
500
+ - path: original-context
501
+ signal:
502
+ signal_name: lang_detection
503
+ - path: original-context
504
+ signal:
505
+ signal_name: text_statistics
506
+ - path: original-response
507
+ signal:
508
+ signal_name: near_dup
509
+ - path: original-response
510
+ signal:
511
+ signal_name: pii
512
+ - path: original-response
513
+ signal:
514
+ signal_name: lang_detection
515
+ - path: original-response
516
+ signal:
517
+ signal_name: text_statistics
518
+ - path:
519
+ - new-instruction
520
+ - value
521
+ - '*'
522
+ signal:
523
+ signal_name: near_dup
524
+ - path:
525
+ - new-instruction
526
+ - value
527
+ - '*'
528
+ signal:
529
+ signal_name: pii
530
+ - path:
531
+ - new-instruction
532
+ - value
533
+ - '*'
534
+ signal:
535
+ signal_name: lang_detection
536
+ - path:
537
+ - new-instruction
538
+ - value
539
+ - '*'
540
+ signal:
541
+ signal_name: text_statistics
542
+ - path:
543
+ - new-context
544
+ - value
545
+ - '*'
546
+ signal:
547
+ signal_name: near_dup
548
+ - path:
549
+ - new-context
550
+ - value
551
+ - '*'
552
+ signal:
553
+ signal_name: pii
554
+ - path:
555
+ - new-context
556
+ - value
557
+ - '*'
558
+ signal:
559
+ signal_name: lang_detection
560
+ - path:
561
+ - new-context
562
+ - value
563
+ - '*'
564
+ signal:
565
+ signal_name: text_statistics
566
+ - path:
567
+ - new-response
568
+ - value
569
+ - '*'
570
+ signal:
571
+ signal_name: near_dup
572
+ - path:
573
+ - new-response
574
+ - value
575
+ - '*'
576
+ signal:
577
+ signal_name: pii
578
+ - path:
579
+ - new-response
580
+ - value
581
+ - '*'
582
+ signal:
583
+ signal_name: lang_detection
584
+ - path:
585
+ - new-response
586
+ - value
587
+ - '*'
588
+ signal:
589
+ signal_name: text_statistics
590
+ - path: original-instruction
591
+ signal:
592
+ embedding: gte-small
593
+ namespace: lilac
594
+ concept_name: legal-termination
595
+ signal_name: concept_score
596
+ - path: original-instruction
597
+ signal:
598
+ embedding: gte-small
599
+ namespace: lilac
600
+ concept_name: negative-sentiment
601
+ signal_name: concept_score
602
+ - path: original-instruction
603
+ signal:
604
+ embedding: gte-small
605
+ namespace: lilac
606
+ concept_name: non-english
607
+ signal_name: concept_score
608
+ - path: original-instruction
609
+ signal:
610
+ embedding: gte-small
611
+ namespace: lilac
612
+ concept_name: positive-sentiment
613
+ signal_name: concept_score
614
+ - path: original-instruction
615
+ signal:
616
+ embedding: gte-small
617
+ namespace: lilac
618
+ concept_name: profanity
619
+ signal_name: concept_score
620
+ - path: original-instruction
621
+ signal:
622
+ embedding: gte-small
623
+ namespace: lilac
624
+ concept_name: question
625
+ signal_name: concept_score
626
+ - path: original-instruction
627
+ signal:
628
+ embedding: gte-small
629
+ namespace: lilac
630
+ concept_name: source-code
631
+ signal_name: concept_score
632
+ - path: original-instruction
633
+ signal:
634
+ embedding: gte-small
635
+ namespace: lilac
636
+ concept_name: toxicity
637
+ signal_name: concept_score
638
+ - path: original-context
639
+ signal:
640
+ embedding: gte-small
641
+ namespace: lilac
642
+ concept_name: legal-termination
643
+ signal_name: concept_score
644
+ - path: original-context
645
+ signal:
646
+ embedding: gte-small
647
+ namespace: lilac
648
+ concept_name: negative-sentiment
649
+ signal_name: concept_score
650
+ - path: original-context
651
+ signal:
652
+ embedding: gte-small
653
+ namespace: lilac
654
+ concept_name: non-english
655
+ signal_name: concept_score
656
+ - path: original-context
657
+ signal:
658
+ embedding: gte-small
659
+ namespace: lilac
660
+ concept_name: positive-sentiment
661
+ signal_name: concept_score
662
+ - path: original-context
663
+ signal:
664
+ embedding: gte-small
665
+ namespace: lilac
666
+ concept_name: profanity
667
+ signal_name: concept_score
668
+ - path: original-context
669
+ signal:
670
+ embedding: gte-small
671
+ namespace: lilac
672
+ concept_name: question
673
+ signal_name: concept_score
674
+ - path: original-context
675
+ signal:
676
+ embedding: gte-small
677
+ namespace: lilac
678
+ concept_name: source-code
679
+ signal_name: concept_score
680
+ - path: original-context
681
+ signal:
682
+ embedding: gte-small
683
+ namespace: lilac
684
+ concept_name: toxicity
685
+ signal_name: concept_score
686
+ - path: original-response
687
+ signal:
688
+ embedding: gte-small
689
+ namespace: lilac
690
+ concept_name: legal-termination
691
+ signal_name: concept_score
692
+ - path: original-response
693
+ signal:
694
+ embedding: gte-small
695
+ namespace: lilac
696
+ concept_name: negative-sentiment
697
+ signal_name: concept_score
698
+ - path: original-response
699
+ signal:
700
+ embedding: gte-small
701
+ namespace: lilac
702
+ concept_name: non-english
703
+ signal_name: concept_score
704
+ - path: original-response
705
+ signal:
706
+ embedding: gte-small
707
+ namespace: lilac
708
+ concept_name: positive-sentiment
709
+ signal_name: concept_score
710
+ - path: original-response
711
+ signal:
712
+ embedding: gte-small
713
+ namespace: lilac
714
+ concept_name: profanity
715
+ signal_name: concept_score
716
+ - path: original-response
717
+ signal:
718
+ embedding: gte-small
719
+ namespace: lilac
720
+ concept_name: question
721
+ signal_name: concept_score
722
+ - path: original-response
723
+ signal:
724
+ embedding: gte-small
725
+ namespace: lilac
726
+ concept_name: source-code
727
+ signal_name: concept_score
728
+ - path: original-response
729
+ signal:
730
+ embedding: gte-small
731
+ namespace: lilac
732
+ concept_name: toxicity
733
+ signal_name: concept_score
734
+ - path:
735
+ - new-instruction
736
+ - value
737
+ - '*'
738
+ signal:
739
+ embedding: gte-small
740
+ namespace: lilac
741
+ concept_name: legal-termination
742
+ signal_name: concept_score
743
+ - path:
744
+ - new-instruction
745
+ - value
746
+ - '*'
747
+ signal:
748
+ embedding: gte-small
749
+ namespace: lilac
750
+ concept_name: negative-sentiment
751
+ signal_name: concept_score
752
+ - path:
753
+ - new-instruction
754
+ - value
755
+ - '*'
756
+ signal:
757
+ embedding: gte-small
758
+ namespace: lilac
759
+ concept_name: non-english
760
+ signal_name: concept_score
761
+ - path:
762
+ - new-instruction
763
+ - value
764
+ - '*'
765
+ signal:
766
+ embedding: gte-small
767
+ namespace: lilac
768
+ concept_name: positive-sentiment
769
+ signal_name: concept_score
770
+ - path:
771
+ - new-instruction
772
+ - value
773
+ - '*'
774
+ signal:
775
+ embedding: gte-small
776
+ namespace: lilac
777
+ concept_name: profanity
778
+ signal_name: concept_score
779
+ - path:
780
+ - new-instruction
781
+ - value
782
+ - '*'
783
+ signal:
784
+ embedding: gte-small
785
+ namespace: lilac
786
+ concept_name: question
787
+ signal_name: concept_score
788
+ - path:
789
+ - new-instruction
790
+ - value
791
+ - '*'
792
+ signal:
793
+ embedding: gte-small
794
+ namespace: lilac
795
+ concept_name: source-code
796
+ signal_name: concept_score
797
+ - path:
798
+ - new-instruction
799
+ - value
800
+ - '*'
801
+ signal:
802
+ embedding: gte-small
803
+ namespace: lilac
804
+ concept_name: toxicity
805
+ signal_name: concept_score
806
+ - path:
807
+ - new-context
808
+ - value
809
+ - '*'
810
+ signal:
811
+ embedding: gte-small
812
+ namespace: lilac
813
+ concept_name: legal-termination
814
+ signal_name: concept_score
815
+ - path:
816
+ - new-context
817
+ - value
818
+ - '*'
819
+ signal:
820
+ embedding: gte-small
821
+ namespace: lilac
822
+ concept_name: negative-sentiment
823
+ signal_name: concept_score
824
+ - path:
825
+ - new-context
826
+ - value
827
+ - '*'
828
+ signal:
829
+ embedding: gte-small
830
+ namespace: lilac
831
+ concept_name: non-english
832
+ signal_name: concept_score
833
+ - path:
834
+ - new-context
835
+ - value
836
+ - '*'
837
+ signal:
838
+ embedding: gte-small
839
+ namespace: lilac
840
+ concept_name: positive-sentiment
841
+ signal_name: concept_score
842
+ - path:
843
+ - new-context
844
+ - value
845
+ - '*'
846
+ signal:
847
+ embedding: gte-small
848
+ namespace: lilac
849
+ concept_name: profanity
850
+ signal_name: concept_score
851
+ - path:
852
+ - new-context
853
+ - value
854
+ - '*'
855
+ signal:
856
+ embedding: gte-small
857
+ namespace: lilac
858
+ concept_name: question
859
+ signal_name: concept_score
860
+ - path:
861
+ - new-context
862
+ - value
863
+ - '*'
864
+ signal:
865
+ embedding: gte-small
866
+ namespace: lilac
867
+ concept_name: source-code
868
+ signal_name: concept_score
869
+ - path:
870
+ - new-context
871
+ - value
872
+ - '*'
873
+ signal:
874
+ embedding: gte-small
875
+ namespace: lilac
876
+ concept_name: toxicity
877
+ signal_name: concept_score
878
+ - path:
879
+ - new-response
880
+ - value
881
+ - '*'
882
+ signal:
883
+ embedding: gte-small
884
+ namespace: lilac
885
+ concept_name: legal-termination
886
+ signal_name: concept_score
887
+ - path:
888
+ - new-response
889
+ - value
890
+ - '*'
891
+ signal:
892
+ embedding: gte-small
893
+ namespace: lilac
894
+ concept_name: negative-sentiment
895
+ signal_name: concept_score
896
+ - path:
897
+ - new-response
898
+ - value
899
+ - '*'
900
+ signal:
901
+ embedding: gte-small
902
+ namespace: lilac
903
+ concept_name: non-english
904
+ signal_name: concept_score
905
+ - path:
906
+ - new-response
907
+ - value
908
+ - '*'
909
+ signal:
910
+ embedding: gte-small
911
+ namespace: lilac
912
+ concept_name: positive-sentiment
913
+ signal_name: concept_score
914
+ - path:
915
+ - new-response
916
+ - value
917
+ - '*'
918
+ signal:
919
+ embedding: gte-small
920
+ namespace: lilac
921
+ concept_name: profanity
922
+ signal_name: concept_score
923
+ - path:
924
+ - new-response
925
+ - value
926
+ - '*'
927
+ signal:
928
+ embedding: gte-small
929
+ namespace: lilac
930
+ concept_name: question
931
+ signal_name: concept_score
932
+ - path:
933
+ - new-response
934
+ - value
935
+ - '*'
936
+ signal:
937
+ embedding: gte-small
938
+ namespace: lilac
939
+ concept_name: source-code
940
+ signal_name: concept_score
941
+ - path:
942
+ - new-response
943
+ - value
944
+ - '*'
945
+ signal:
946
+ embedding: gte-small
947
+ namespace: lilac
948
+ concept_name: toxicity
949
+ signal_name: concept_score
950
+ settings:
951
+ ui:
952
+ media_paths:
953
+ - original-instruction
954
+ - original-context
955
+ - original-response
956
+ - - new-instruction
957
+ - value
958
+ - '*'
959
+ - - new-context
960
+ - value
961
+ - '*'
962
+ - - new-response
963
+ - value
964
+ - '*'
965
+ preferred_embedding: gte-small
966
+ - namespace: lilac
967
+ name: piqa
968
+ source:
969
+ dataset_name: piqa
970
+ source_name: huggingface
971
+ embeddings:
972
+ - path: goal
973
+ embedding: gte-small
974
+ - path: sol1
975
+ embedding: gte-small
976
+ - path: sol2
977
+ embedding: gte-small
978
+ signals:
979
+ - path: goal
980
+ signal:
981
+ signal_name: near_dup
982
+ - path: goal
983
+ signal:
984
+ signal_name: pii
985
+ - path: goal
986
+ signal:
987
+ signal_name: lang_detection
988
+ - path: goal
989
+ signal:
990
+ embedding: gte-small
991
+ namespace: lilac
992
+ concept_name: positive-sentiment
993
+ signal_name: concept_score
994
+ - path: goal
995
+ signal:
996
+ embedding: gte-small
997
+ namespace: lilac
998
+ concept_name: non-english
999
+ signal_name: concept_score
1000
+ - path: goal
1001
+ signal:
1002
+ embedding: gte-small
1003
+ namespace: lilac
1004
+ concept_name: toxicity
1005
+ signal_name: concept_score
1006
+ - path: goal
1007
+ signal:
1008
+ embedding: gte-small
1009
+ namespace: lilac
1010
+ concept_name: question
1011
+ signal_name: concept_score
1012
+ - path: goal
1013
+ signal:
1014
+ embedding: gte-small
1015
+ namespace: lilac
1016
+ concept_name: legal-termination
1017
+ signal_name: concept_score
1018
+ - path: goal
1019
+ signal:
1020
+ embedding: gte-small
1021
+ namespace: lilac
1022
+ concept_name: source-code
1023
+ signal_name: concept_score
1024
+ - path: goal
1025
+ signal:
1026
+ embedding: gte-small
1027
+ namespace: lilac
1028
+ concept_name: negative-sentiment
1029
+ signal_name: concept_score
1030
+ - path: goal
1031
+ signal:
1032
+ embedding: gte-small
1033
+ namespace: lilac
1034
+ concept_name: profanity
1035
+ signal_name: concept_score
1036
+ - path: goal
1037
+ signal:
1038
+ signal_name: text_statistics
1039
+ - path: sol1
1040
+ signal:
1041
+ signal_name: near_dup
1042
+ - path: sol1
1043
+ signal:
1044
+ signal_name: pii
1045
+ - path: sol1
1046
+ signal:
1047
+ signal_name: lang_detection
1048
+ - path: sol1
1049
+ signal:
1050
+ embedding: gte-small
1051
+ namespace: lilac
1052
+ concept_name: positive-sentiment
1053
+ signal_name: concept_score
1054
+ - path: sol1
1055
+ signal:
1056
+ embedding: gte-small
1057
+ namespace: lilac
1058
+ concept_name: non-english
1059
+ signal_name: concept_score
1060
+ - path: sol1
1061
+ signal:
1062
+ embedding: gte-small
1063
+ namespace: lilac
1064
+ concept_name: toxicity
1065
+ signal_name: concept_score
1066
+ - path: sol1
1067
+ signal:
1068
+ embedding: gte-small
1069
+ namespace: lilac
1070
+ concept_name: question
1071
+ signal_name: concept_score
1072
+ - path: sol1
1073
+ signal:
1074
+ embedding: gte-small
1075
+ namespace: lilac
1076
+ concept_name: legal-termination
1077
+ signal_name: concept_score
1078
+ - path: sol1
1079
+ signal:
1080
+ embedding: gte-small
1081
+ namespace: lilac
1082
+ concept_name: source-code
1083
+ signal_name: concept_score
1084
+ - path: sol1
1085
+ signal:
1086
+ embedding: gte-small
1087
+ namespace: lilac
1088
+ concept_name: negative-sentiment
1089
+ signal_name: concept_score
1090
+ - path: sol1
1091
+ signal:
1092
+ embedding: gte-small
1093
+ namespace: lilac
1094
+ concept_name: profanity
1095
+ signal_name: concept_score
1096
+ - path: sol1
1097
+ signal:
1098
+ signal_name: text_statistics
1099
+ - path: sol2
1100
+ signal:
1101
+ signal_name: near_dup
1102
+ - path: sol2
1103
+ signal:
1104
+ signal_name: pii
1105
+ - path: sol2
1106
+ signal:
1107
+ signal_name: lang_detection
1108
+ - path: sol2
1109
+ signal:
1110
+ embedding: gte-small
1111
+ namespace: lilac
1112
+ concept_name: positive-sentiment
1113
+ signal_name: concept_score
1114
+ - path: sol2
1115
+ signal:
1116
+ embedding: gte-small
1117
+ namespace: lilac
1118
+ concept_name: non-english
1119
+ signal_name: concept_score
1120
+ - path: sol2
1121
+ signal:
1122
+ embedding: gte-small
1123
+ namespace: lilac
1124
+ concept_name: toxicity
1125
+ signal_name: concept_score
1126
+ - path: sol2
1127
+ signal:
1128
+ embedding: gte-small
1129
+ namespace: lilac
1130
+ concept_name: question
1131
+ signal_name: concept_score
1132
+ - path: sol2
1133
+ signal:
1134
+ embedding: gte-small
1135
+ namespace: lilac
1136
+ concept_name: legal-termination
1137
+ signal_name: concept_score
1138
+ - path: sol2
1139
+ signal:
1140
+ embedding: gte-small
1141
+ namespace: lilac
1142
+ concept_name: source-code
1143
+ signal_name: concept_score
1144
+ - path: sol2
1145
+ signal:
1146
+ embedding: gte-small
1147
+ namespace: lilac
1148
+ concept_name: negative-sentiment
1149
+ signal_name: concept_score
1150
+ - path: sol2
1151
+ signal:
1152
+ embedding: gte-small
1153
+ namespace: lilac
1154
+ concept_name: profanity
1155
+ signal_name: concept_score
1156
+ - path: sol2
1157
+ signal:
1158
+ signal_name: text_statistics
1159
+ settings:
1160
+ ui:
1161
+ media_paths:
1162
+ - sol1
1163
+ - sol2
1164
+ - goal
1165
+ preferred_embedding: gte-small
1166
+ - namespace: lilac
1167
+ name: OpenOrca-100k
1168
+ source:
1169
+ dataset_name: Open-Orca/OpenOrca
1170
+ sample_size: 100000
1171
+ source_name: huggingface
1172
+ embeddings:
1173
+ - path: question
1174
+ embedding: gte-small
1175
+ - path: response
1176
+ embedding: gte-small
1177
+ signals:
1178
+ - path: question
1179
+ signal:
1180
+ signal_name: near_dup
1181
+ - path: question
1182
+ signal:
1183
+ signal_name: pii
1184
+ - path: question
1185
+ signal:
1186
+ signal_name: lang_detection
1187
+ - path: question
1188
+ signal:
1189
+ embedding: gte-small
1190
+ namespace: lilac
1191
+ concept_name: positive-sentiment
1192
+ signal_name: concept_score
1193
+ - path: question
1194
+ signal:
1195
+ embedding: gte-small
1196
+ namespace: lilac
1197
+ concept_name: non-english
1198
+ signal_name: concept_score
1199
+ - path: question
1200
+ signal:
1201
+ embedding: gte-small
1202
+ namespace: lilac
1203
+ concept_name: toxicity
1204
+ signal_name: concept_score
1205
+ - path: question
1206
+ signal:
1207
+ embedding: gte-small
1208
+ namespace: lilac
1209
+ concept_name: question
1210
+ signal_name: concept_score
1211
+ - path: question
1212
+ signal:
1213
+ embedding: gte-small
1214
+ namespace: lilac
1215
+ concept_name: legal-termination
1216
+ signal_name: concept_score
1217
+ - path: question
1218
+ signal:
1219
+ embedding: gte-small
1220
+ namespace: lilac
1221
+ concept_name: source-code
1222
+ signal_name: concept_score
1223
+ - path: question
1224
+ signal:
1225
+ embedding: gte-small
1226
+ namespace: lilac
1227
+ concept_name: negative-sentiment
1228
+ signal_name: concept_score
1229
+ - path: question
1230
+ signal:
1231
+ embedding: gte-small
1232
+ namespace: lilac
1233
+ concept_name: profanity
1234
+ signal_name: concept_score
1235
+ - path: question
1236
+ signal:
1237
+ signal_name: text_statistics
1238
+ - path: response
1239
+ signal:
1240
+ signal_name: near_dup
1241
+ - path: response
1242
+ signal:
1243
+ signal_name: pii
1244
+ - path: response
1245
+ signal:
1246
+ signal_name: lang_detection
1247
+ - path: response
1248
+ signal:
1249
+ embedding: gte-small
1250
+ namespace: lilac
1251
+ concept_name: positive-sentiment
1252
+ signal_name: concept_score
1253
+ - path: response
1254
+ signal:
1255
+ embedding: gte-small
1256
+ namespace: lilac
1257
+ concept_name: non-english
1258
+ signal_name: concept_score
1259
+ - path: response
1260
+ signal:
1261
+ embedding: gte-small
1262
+ namespace: lilac
1263
+ concept_name: toxicity
1264
+ signal_name: concept_score
1265
+ - path: response
1266
+ signal:
1267
+ embedding: gte-small
1268
+ namespace: lilac
1269
+ concept_name: question
1270
+ signal_name: concept_score
1271
+ - path: response
1272
+ signal:
1273
+ embedding: gte-small
1274
+ namespace: lilac
1275
+ concept_name: legal-termination
1276
+ signal_name: concept_score
1277
+ - path: response
1278
+ signal:
1279
+ embedding: gte-small
1280
+ namespace: lilac
1281
+ concept_name: source-code
1282
+ signal_name: concept_score
1283
+ - path: response
1284
+ signal:
1285
+ embedding: gte-small
1286
+ namespace: lilac
1287
+ concept_name: negative-sentiment
1288
+ signal_name: concept_score
1289
+ - path: response
1290
+ signal:
1291
+ embedding: gte-small
1292
+ namespace: lilac
1293
+ concept_name: profanity
1294
+ signal_name: concept_score
1295
+ - path: response
1296
+ signal:
1297
+ signal_name: text_statistics
1298
+ settings:
1299
+ ui:
1300
+ media_paths:
1301
+ - question
1302
+ - response
1303
+ preferred_embedding: gte-small
1304
+ - namespace: lilac
1305
+ name: opus100-en-es-validation
1306
+ source:
1307
+ dataset_name: opus100
1308
+ config_name: en-es
1309
+ split: validation
1310
+ source_name: huggingface
1311
+ embeddings:
1312
+ - path:
1313
+ - translation
1314
+ - en
1315
+ embedding: gte-small
1316
+ - path:
1317
+ - translation
1318
+ - es
1319
+ embedding: gte-small
1320
+ signals:
1321
+ - path:
1322
+ - translation
1323
+ - en
1324
+ signal:
1325
+ signal_name: near_dup
1326
+ - path:
1327
+ - translation
1328
+ - en
1329
+ signal:
1330
+ signal_name: pii
1331
+ - path:
1332
+ - translation
1333
+ - en
1334
+ signal:
1335
+ signal_name: lang_detection
1336
+ - path:
1337
+ - translation
1338
+ - en
1339
+ signal:
1340
+ embedding: gte-small
1341
+ namespace: lilac
1342
+ concept_name: positive-sentiment
1343
+ signal_name: concept_score
1344
+ - path:
1345
+ - translation
1346
+ - en
1347
+ signal:
1348
+ embedding: gte-small
1349
+ namespace: lilac
1350
+ concept_name: non-english
1351
+ signal_name: concept_score
1352
+ - path:
1353
+ - translation
1354
+ - en
1355
+ signal:
1356
+ embedding: gte-small
1357
+ namespace: lilac
1358
+ concept_name: toxicity
1359
+ signal_name: concept_score
1360
+ - path:
1361
+ - translation
1362
+ - en
1363
+ signal:
1364
+ embedding: gte-small
1365
+ namespace: lilac
1366
+ concept_name: question
1367
+ signal_name: concept_score
1368
+ - path:
1369
+ - translation
1370
+ - en
1371
+ signal:
1372
+ embedding: gte-small
1373
+ namespace: lilac
1374
+ concept_name: legal-termination
1375
+ signal_name: concept_score
1376
+ - path:
1377
+ - translation
1378
+ - en
1379
+ signal:
1380
+ embedding: gte-small
1381
+ namespace: lilac
1382
+ concept_name: source-code
1383
+ signal_name: concept_score
1384
+ - path:
1385
+ - translation
1386
+ - en
1387
+ signal:
1388
+ embedding: gte-small
1389
+ namespace: lilac
1390
+ concept_name: negative-sentiment
1391
+ signal_name: concept_score
1392
+ - path:
1393
+ - translation
1394
+ - en
1395
+ signal:
1396
+ embedding: gte-small
1397
+ namespace: lilac
1398
+ concept_name: profanity
1399
+ signal_name: concept_score
1400
+ - path:
1401
+ - translation
1402
+ - en
1403
+ signal:
1404
+ signal_name: text_statistics
1405
+ - path:
1406
+ - translation
1407
+ - es
1408
+ signal:
1409
+ signal_name: near_dup
1410
+ - path:
1411
+ - translation
1412
+ - es
1413
+ signal:
1414
+ signal_name: pii
1415
+ - path:
1416
+ - translation
1417
+ - es
1418
+ signal:
1419
+ signal_name: lang_detection
1420
+ - path:
1421
+ - translation
1422
+ - es
1423
+ signal:
1424
+ embedding: gte-small
1425
+ namespace: lilac
1426
+ concept_name: positive-sentiment
1427
+ signal_name: concept_score
1428
+ - path:
1429
+ - translation
1430
+ - es
1431
+ signal:
1432
+ embedding: gte-small
1433
+ namespace: lilac
1434
+ concept_name: non-english
1435
+ signal_name: concept_score
1436
+ - path:
1437
+ - translation
1438
+ - es
1439
+ signal:
1440
+ embedding: gte-small
1441
+ namespace: lilac
1442
+ concept_name: toxicity
1443
+ signal_name: concept_score
1444
+ - path:
1445
+ - translation
1446
+ - es
1447
+ signal:
1448
+ embedding: gte-small
1449
+ namespace: lilac
1450
+ concept_name: question
1451
+ signal_name: concept_score
1452
+ - path:
1453
+ - translation
1454
+ - es
1455
+ signal:
1456
+ embedding: gte-small
1457
+ namespace: lilac
1458
+ concept_name: legal-termination
1459
+ signal_name: concept_score
1460
+ - path:
1461
+ - translation
1462
+ - es
1463
+ signal:
1464
+ embedding: gte-small
1465
+ namespace: lilac
1466
+ concept_name: source-code
1467
+ signal_name: concept_score
1468
+ - path:
1469
+ - translation
1470
+ - es
1471
+ signal:
1472
+ embedding: gte-small
1473
+ namespace: lilac
1474
+ concept_name: negative-sentiment
1475
+ signal_name: concept_score
1476
+ - path:
1477
+ - translation
1478
+ - es
1479
+ signal:
1480
+ embedding: gte-small
1481
+ namespace: lilac
1482
+ concept_name: profanity
1483
+ signal_name: concept_score
1484
+ - path:
1485
+ - translation
1486
+ - es
1487
+ signal:
1488
+ signal_name: text_statistics
1489
+ settings:
1490
+ ui:
1491
+ media_paths:
1492
+ - - translation
1493
+ - es
1494
+ - - translation
1495
+ - en
1496
+ preferred_embedding: gte-small
1497
+ - namespace: lilac
1498
+ name: mmlu_professional_law
1499
+ source:
1500
+ dataset_name: cais/mmlu
1501
+ config_name: professional_law
1502
+ source_name: huggingface
1503
+ embeddings:
1504
+ - path: question
1505
+ embedding: gte-small
1506
+ - path:
1507
+ - choices
1508
+ - '*'
1509
+ embedding: gte-small
1510
+ signals:
1511
+ - path: question
1512
+ signal:
1513
+ signal_name: near_dup
1514
+ - path: question
1515
+ signal:
1516
+ signal_name: pii
1517
+ - path: question
1518
+ signal:
1519
+ signal_name: lang_detection
1520
+ - path: question
1521
+ signal:
1522
+ embedding: gte-small
1523
+ namespace: lilac
1524
+ concept_name: positive-sentiment
1525
+ signal_name: concept_score
1526
+ - path: question
1527
+ signal:
1528
+ embedding: gte-small
1529
+ namespace: lilac
1530
+ concept_name: non-english
1531
+ signal_name: concept_score
1532
+ - path: question
1533
+ signal:
1534
+ embedding: gte-small
1535
+ namespace: lilac
1536
+ concept_name: toxicity
1537
+ signal_name: concept_score
1538
+ - path: question
1539
+ signal:
1540
+ embedding: gte-small
1541
+ namespace: lilac
1542
+ concept_name: question
1543
+ signal_name: concept_score
1544
+ - path: question
1545
+ signal:
1546
+ embedding: gte-small
1547
+ namespace: lilac
1548
+ concept_name: legal-termination
1549
+ signal_name: concept_score
1550
+ - path: question
1551
+ signal:
1552
+ embedding: gte-small
1553
+ namespace: lilac
1554
+ concept_name: source-code
1555
+ signal_name: concept_score
1556
+ - path: question
1557
+ signal:
1558
+ embedding: gte-small
1559
+ namespace: lilac
1560
+ concept_name: negative-sentiment
1561
+ signal_name: concept_score
1562
+ - path: question
1563
+ signal:
1564
+ embedding: gte-small
1565
+ namespace: lilac
1566
+ concept_name: profanity
1567
+ signal_name: concept_score
1568
+ - path: question
1569
+ signal:
1570
+ signal_name: text_statistics
1571
+ - path:
1572
+ - choices
1573
+ - '*'
1574
+ signal:
1575
+ signal_name: near_dup
1576
+ - path:
1577
+ - choices
1578
+ - '*'
1579
+ signal:
1580
+ signal_name: pii
1581
+ - path:
1582
+ - choices
1583
+ - '*'
1584
+ signal:
1585
+ signal_name: lang_detection
1586
+ - path:
1587
+ - choices
1588
+ - '*'
1589
+ signal:
1590
+ embedding: gte-small
1591
+ namespace: lilac
1592
+ concept_name: positive-sentiment
1593
+ signal_name: concept_score
1594
+ - path:
1595
+ - choices
1596
+ - '*'
1597
+ signal:
1598
+ embedding: gte-small
1599
+ namespace: lilac
1600
+ concept_name: non-english
1601
+ signal_name: concept_score
1602
+ - path:
1603
+ - choices
1604
+ - '*'
1605
+ signal:
1606
+ embedding: gte-small
1607
+ namespace: lilac
1608
+ concept_name: toxicity
1609
+ signal_name: concept_score
1610
+ - path:
1611
+ - choices
1612
+ - '*'
1613
+ signal:
1614
+ embedding: gte-small
1615
+ namespace: lilac
1616
+ concept_name: question
1617
+ signal_name: concept_score
1618
+ - path:
1619
+ - choices
1620
+ - '*'
1621
+ signal:
1622
+ embedding: gte-small
1623
+ namespace: lilac
1624
+ concept_name: legal-termination
1625
+ signal_name: concept_score
1626
+ - path:
1627
+ - choices
1628
+ - '*'
1629
+ signal:
1630
+ embedding: gte-small
1631
+ namespace: lilac
1632
+ concept_name: source-code
1633
+ signal_name: concept_score
1634
+ - path:
1635
+ - choices
1636
+ - '*'
1637
+ signal:
1638
+ embedding: gte-small
1639
+ namespace: lilac
1640
+ concept_name: negative-sentiment
1641
+ signal_name: concept_score
1642
+ - path:
1643
+ - choices
1644
+ - '*'
1645
+ signal:
1646
+ embedding: gte-small
1647
+ namespace: lilac
1648
+ concept_name: negative-sentiment
1649
+ signal_name: concept_score
1650
+ - path:
1651
+ - choices
1652
+ - '*'
1653
+ signal:
1654
+ embedding: gte-small
1655
+ namespace: lilac
1656
+ concept_name: profanity
1657
+ signal_name: concept_score
1658
+ - path:
1659
+ - choices
1660
+ - '*'
1661
+ signal:
1662
+ signal_name: text_statistics
1663
+ settings:
1664
+ ui:
1665
+ media_paths:
1666
+ - question
1667
+ - - choices
1668
+ - '*'
1669
+ preferred_embedding: gte-small
1670
+ - namespace: lilac
1671
+ name: pile-of-law-r-legaladvice
1672
+ source:
1673
+ dataset_name: pile-of-law/pile-of-law
1674
+ config_name: r_legaladvice
1675
+ source_name: huggingface
1676
+ embeddings:
1677
+ - path: text
1678
+ embedding: gte-small
1679
+ signals:
1680
+ - path: text
1681
+ signal:
1682
+ signal_name: near_dup
1683
+ - path: text
1684
+ signal:
1685
+ signal_name: pii
1686
+ - path: text
1687
+ signal:
1688
+ signal_name: lang_detection
1689
+ - path: text
1690
+ signal:
1691
+ embedding: gte-small
1692
+ namespace: lilac
1693
+ concept_name: positive-sentiment
1694
+ signal_name: concept_score
1695
+ - path: text
1696
+ signal:
1697
+ embedding: gte-small
1698
+ namespace: lilac
1699
+ concept_name: non-english
1700
+ signal_name: concept_score
1701
+ - path: text
1702
+ signal:
1703
+ embedding: gte-small
1704
+ namespace: lilac
1705
+ concept_name: toxicity
1706
+ signal_name: concept_score
1707
+ - path: text
1708
+ signal:
1709
+ embedding: gte-small
1710
+ namespace: lilac
1711
+ concept_name: question
1712
+ signal_name: concept_score
1713
+ - path: text
1714
+ signal:
1715
+ embedding: gte-small
1716
+ namespace: lilac
1717
+ concept_name: legal-termination
1718
+ signal_name: concept_score
1719
+ - path: text
1720
+ signal:
1721
+ embedding: gte-small
1722
+ namespace: lilac
1723
+ concept_name: source-code
1724
+ signal_name: concept_score
1725
+ - path: text
1726
+ signal:
1727
+ embedding: gte-small
1728
+ namespace: lilac
1729
+ concept_name: negative-sentiment
1730
+ signal_name: concept_score
1731
+ - path: text
1732
+ signal:
1733
+ embedding: gte-small
1734
+ namespace: lilac
1735
+ concept_name: profanity
1736
+ signal_name: concept_score
1737
+ - path: text
1738
+ signal:
1739
+ signal_name: text_statistics
1740
+ settings:
1741
+ ui:
1742
+ media_paths:
1743
+ - text
1744
+ preferred_embedding: gte-small
1745
+ - namespace: lilac
1746
+ name: science-qa-derek-thomas
1747
+ source:
1748
+ dataset_name: derek-thomas/ScienceQA
1749
+ source_name: huggingface
1750
+ embeddings:
1751
+ - path: lecture
1752
+ embedding: gte-small
1753
+ signals:
1754
+ - path: lecture
1755
+ signal:
1756
+ signal_name: near_dup
1757
+ - path: lecture
1758
+ signal:
1759
+ signal_name: pii
1760
+ - path: lecture
1761
+ signal:
1762
+ signal_name: lang_detection
1763
+ - path: lecture
1764
+ signal:
1765
+ signal_name: text_statistics
1766
+ - path: lecture
1767
+ signal:
1768
+ embedding: gte-small
1769
+ namespace: lilac
1770
+ concept_name: legal-termination
1771
+ signal_name: concept_score
1772
+ - path: lecture
1773
+ signal:
1774
+ embedding: gte-small
1775
+ namespace: lilac
1776
+ concept_name: negative-sentiment
1777
+ signal_name: concept_score
1778
+ - path: lecture
1779
+ signal:
1780
+ embedding: gte-small
1781
+ namespace: lilac
1782
+ concept_name: non-english
1783
+ signal_name: concept_score
1784
+ - path: lecture
1785
+ signal:
1786
+ embedding: gte-small
1787
+ namespace: lilac
1788
+ concept_name: positive-sentiment
1789
+ signal_name: concept_score
1790
+ - path: lecture
1791
+ signal:
1792
+ embedding: gte-small
1793
+ namespace: lilac
1794
+ concept_name: profanity
1795
+ signal_name: concept_score
1796
+ - path: lecture
1797
+ signal:
1798
+ embedding: gte-small
1799
+ namespace: lilac
1800
+ concept_name: question
1801
+ signal_name: concept_score
1802
+ - path: lecture
1803
+ signal:
1804
+ embedding: gte-small
1805
+ namespace: lilac
1806
+ concept_name: source-code
1807
+ signal_name: concept_score
1808
+ - path: lecture
1809
+ signal:
1810
+ embedding: gte-small
1811
+ namespace: lilac
1812
+ concept_name: toxicity
1813
+ signal_name: concept_score
1814
+ settings:
1815
+ ui:
1816
+ media_paths:
1817
+ - lecture
1818
+ preferred_embedding: gte-small
1819
+ - namespace: lilac
1820
+ name: enron-emails
1821
+ source:
1822
+ dataset_name: EleutherAI/pile
1823
+ config_name: enron_emails
1824
+ sample_size: 100000
1825
+ source_name: huggingface
1826
+ embeddings:
1827
+ - path: text
1828
+ embedding: gte-small
1829
+ signals:
1830
+ - path: text
1831
+ signal:
1832
+ signal_name: near_dup
1833
+ - path: text
1834
+ signal:
1835
+ signal_name: pii
1836
+ - path: text
1837
+ signal:
1838
+ signal_name: lang_detection
1839
+ - path: text
1840
+ signal:
1841
+ embedding: gte-small
1842
+ namespace: lilac
1843
+ concept_name: positive-sentiment
1844
+ signal_name: concept_score
1845
+ - path: text
1846
+ signal:
1847
+ embedding: gte-small
1848
+ namespace: lilac
1849
+ concept_name: non-english
1850
+ signal_name: concept_score
1851
+ - path: text
1852
+ signal:
1853
+ embedding: gte-small
1854
+ namespace: lilac
1855
+ concept_name: toxicity
1856
+ signal_name: concept_score
1857
+ - path: text
1858
+ signal:
1859
+ embedding: gte-small
1860
+ namespace: lilac
1861
+ concept_name: question
1862
+ signal_name: concept_score
1863
+ - path: text
1864
+ signal:
1865
+ embedding: gte-small
1866
+ namespace: lilac
1867
+ concept_name: legal-termination
1868
+ signal_name: concept_score
1869
+ - path: text
1870
+ signal:
1871
+ embedding: gte-small
1872
+ namespace: lilac
1873
+ concept_name: source-code
1874
+ signal_name: concept_score
1875
+ - path: text
1876
+ signal:
1877
+ embedding: gte-small
1878
+ namespace: lilac
1879
+ concept_name: negative-sentiment
1880
+ signal_name: concept_score
1881
+ - path: text
1882
+ signal:
1883
+ embedding: gte-small
1884
+ namespace: lilac
1885
+ concept_name: profanity
1886
+ signal_name: concept_score
1887
+ - path: text
1888
+ signal:
1889
+ signal_name: text_statistics
1890
+ settings:
1891
+ ui:
1892
+ media_paths:
1893
+ - text
1894
+ preferred_embedding: gte-small
1895
+ - namespace: lilac
1896
+ name: the_movies_dataset
1897
+ source:
1898
+ filepaths:
1899
+ - https://storage.googleapis.com/lilac-data/datasets/the_movies_dataset/the_movies_dataset.csv
1900
+ source_name: csv
1901
+ embeddings:
1902
+ - path: overview
1903
+ embedding: gte-small
1904
+ signals:
1905
+ - path: overview
1906
+ signal:
1907
+ signal_name: near_dup
1908
+ - path: overview
1909
+ signal:
1910
+ signal_name: pii
1911
+ - path: overview
1912
+ signal:
1913
+ signal_name: lang_detection
1914
+ - path: overview
1915
+ signal:
1916
+ signal_name: text_statistics
1917
+ - path: overview
1918
+ signal:
1919
+ embedding: gte-small
1920
+ namespace: lilac
1921
+ concept_name: legal-termination
1922
+ signal_name: concept_score
1923
+ - path: overview
1924
+ signal:
1925
+ embedding: gte-small
1926
+ namespace: lilac
1927
+ concept_name: negative-sentiment
1928
+ signal_name: concept_score
1929
+ - path: overview
1930
+ signal:
1931
+ embedding: gte-small
1932
+ namespace: lilac
1933
+ concept_name: non-english
1934
+ signal_name: concept_score
1935
+ - path: overview
1936
+ signal:
1937
+ embedding: gte-small
1938
+ namespace: lilac
1939
+ concept_name: positive-sentiment
1940
+ signal_name: concept_score
1941
+ - path: overview
1942
+ signal:
1943
+ embedding: gte-small
1944
+ namespace: lilac
1945
+ concept_name: profanity
1946
+ signal_name: concept_score
1947
+ - path: overview
1948
+ signal:
1949
+ embedding: gte-small
1950
+ namespace: lilac
1951
+ concept_name: question
1952
+ signal_name: concept_score
1953
+ - path: overview
1954
+ signal:
1955
+ embedding: gte-small
1956
+ namespace: lilac
1957
+ concept_name: source-code
1958
+ signal_name: concept_score
1959
+ - path: overview
1960
+ signal:
1961
+ embedding: gte-small
1962
+ namespace: lilac
1963
+ concept_name: toxicity
1964
+ signal_name: concept_score
1965
+ settings:
1966
+ ui:
1967
+ media_paths:
1968
+ - overview
1969
+ preferred_embedding: gte-small