Spaces:
Running
Running
Push
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- .env +1 -1
- .gitattributes +0 -116
- data/.cache/lilac/concept/lilac/legal-termination/cohere.pkl +0 -0
- data/.cache/lilac/concept/lilac/legal-termination/gte-base.pkl +0 -0
- data/.cache/lilac/concept/lilac/legal-termination/gte-small.pkl +0 -0
- data/.cache/lilac/concept/lilac/legal-termination/openai.pkl +0 -0
- data/.cache/lilac/concept/lilac/legal-termination/palm.pkl +0 -0
- data/.cache/lilac/concept/lilac/legal-termination/sbert.pkl +0 -0
- data/.cache/lilac/concept/lilac/negative-sentiment/cohere.pkl +0 -3
- data/.cache/lilac/concept/lilac/negative-sentiment/gte-base.pkl +0 -0
- data/.cache/lilac/concept/lilac/negative-sentiment/gte-small.pkl +0 -0
- data/.cache/lilac/concept/lilac/negative-sentiment/openai.pkl +0 -0
- data/.cache/lilac/concept/lilac/negative-sentiment/palm.pkl +0 -0
- data/.cache/lilac/concept/lilac/negative-sentiment/sbert.pkl +0 -0
- data/.cache/lilac/concept/lilac/positive-sentiment/cohere.pkl +0 -3
- data/.cache/lilac/concept/lilac/positive-sentiment/gte-base.pkl +0 -0
- data/.cache/lilac/concept/lilac/positive-sentiment/gte-small.pkl +0 -0
- data/.cache/lilac/concept/lilac/positive-sentiment/openai.pkl +0 -0
- data/.cache/lilac/concept/lilac/positive-sentiment/palm.pkl +0 -0
- data/.cache/lilac/concept/lilac/positive-sentiment/sbert.pkl +0 -0
- data/.cache/lilac/concept/lilac/profanity/cohere.pkl +0 -3
- data/.cache/lilac/concept/lilac/profanity/gte-base.pkl +0 -3
- data/.cache/lilac/concept/lilac/profanity/gte-small.pkl +0 -3
- data/.cache/lilac/concept/lilac/profanity/openai.pkl +0 -3
- data/.cache/lilac/concept/lilac/profanity/palm.pkl +0 -3
- data/.cache/lilac/concept/lilac/profanity/sbert.pkl +0 -3
- data/.cache/lilac/concept/lilac/question/cohere.pkl +0 -3
- data/.cache/lilac/concept/lilac/question/gte-base.pkl +0 -3
- data/.cache/lilac/concept/lilac/question/gte-small.pkl +0 -0
- data/.cache/lilac/concept/lilac/question/openai.pkl +0 -3
- data/.cache/lilac/concept/lilac/question/palm.pkl +0 -3
- data/.cache/lilac/concept/lilac/question/sbert.pkl +0 -0
- data/.cache/lilac/concept/lilac/source-code/cohere.pkl +0 -0
- data/.cache/lilac/concept/lilac/source-code/gte-base.pkl +0 -0
- data/.cache/lilac/concept/lilac/source-code/gte-small.pkl +0 -0
- data/.cache/lilac/concept/lilac/source-code/openai.pkl +0 -0
- data/.cache/lilac/concept/lilac/source-code/palm.pkl +0 -0
- data/.cache/lilac/concept/lilac/source-code/sbert.pkl +0 -0
- data/.cache/lilac/concept/lilac/toxicity/cohere.pkl +0 -3
- data/.cache/lilac/concept/lilac/toxicity/gte-base.pkl +0 -3
- data/.cache/lilac/concept/lilac/toxicity/gte-small.pkl +0 -3
- data/.cache/lilac/concept/lilac/toxicity/openai.pkl +0 -3
- data/.cache/lilac/concept/lilac/toxicity/palm.pkl +0 -3
- data/.cache/lilac/concept/lilac/toxicity/sbert.pkl +0 -3
- data/datasets/lilac/OpenOrca-100k/config.yml +0 -28
- data/datasets/lilac/OpenOrca-100k/data-00000-of-00001.parquet +0 -3
- data/datasets/lilac/OpenOrca-100k/manifest.json +0 -24
- data/datasets/lilac/OpenOrca-100k/question/gte-small/hnsw.hnswlib.bin +0 -3
- data/datasets/lilac/OpenOrca-100k/question/gte-small/hnsw.lookup.pkl +0 -3
- data/datasets/lilac/OpenOrca-100k/question/gte-small/signal_manifest.json +0 -32
.env
CHANGED
@@ -1,7 +1,7 @@
|
|
1 |
# To overwrite these variables, create a .env.local file
|
2 |
|
3 |
# The path to the directory where the data will be downloaded on machine
|
4 |
-
LILAC_DATA_PATH=./
|
5 |
|
6 |
# Set to 1 for duckdb to use views instead of materialized tables (lower memory usage, but slower).
|
7 |
DUCKDB_USE_VIEWS=0
|
|
|
1 |
# To overwrite these variables, create a .env.local file
|
2 |
|
3 |
# The path to the directory where the data will be downloaded on machine
|
4 |
+
LILAC_DATA_PATH=./data
|
5 |
|
6 |
# Set to 1 for duckdb to use views instead of materialized tables (lower memory usage, but slower).
|
7 |
DUCKDB_USE_VIEWS=0
|
.gitattributes
DELETED
@@ -1,116 +0,0 @@
|
|
1 |
-
data/.cache/lilac/concept/lilac/negative-sentiment/cohere.pkl filter=lfs diff=lfs merge=lfs -text
|
2 |
-
data/.cache/lilac/concept/lilac/positive-sentiment/cohere.pkl filter=lfs diff=lfs merge=lfs -text
|
3 |
-
data/.cache/lilac/concept/lilac/profanity/cohere.pkl filter=lfs diff=lfs merge=lfs -text
|
4 |
-
data/.cache/lilac/concept/lilac/profanity/gte-base.pkl filter=lfs diff=lfs merge=lfs -text
|
5 |
-
data/.cache/lilac/concept/lilac/profanity/gte-small.pkl filter=lfs diff=lfs merge=lfs -text
|
6 |
-
data/.cache/lilac/concept/lilac/profanity/openai.pkl filter=lfs diff=lfs merge=lfs -text
|
7 |
-
data/.cache/lilac/concept/lilac/profanity/palm.pkl filter=lfs diff=lfs merge=lfs -text
|
8 |
-
data/.cache/lilac/concept/lilac/profanity/sbert.pkl filter=lfs diff=lfs merge=lfs -text
|
9 |
-
data/.cache/lilac/concept/lilac/question/cohere.pkl filter=lfs diff=lfs merge=lfs -text
|
10 |
-
data/.cache/lilac/concept/lilac/question/gte-base.pkl filter=lfs diff=lfs merge=lfs -text
|
11 |
-
data/.cache/lilac/concept/lilac/question/openai.pkl filter=lfs diff=lfs merge=lfs -text
|
12 |
-
data/.cache/lilac/concept/lilac/question/palm.pkl filter=lfs diff=lfs merge=lfs -text
|
13 |
-
data/.cache/lilac/concept/lilac/toxicity/cohere.pkl filter=lfs diff=lfs merge=lfs -text
|
14 |
-
data/.cache/lilac/concept/lilac/toxicity/gte-base.pkl filter=lfs diff=lfs merge=lfs -text
|
15 |
-
data/.cache/lilac/concept/lilac/toxicity/gte-small.pkl filter=lfs diff=lfs merge=lfs -text
|
16 |
-
data/.cache/lilac/concept/lilac/toxicity/openai.pkl filter=lfs diff=lfs merge=lfs -text
|
17 |
-
data/.cache/lilac/concept/lilac/toxicity/palm.pkl filter=lfs diff=lfs merge=lfs -text
|
18 |
-
data/.cache/lilac/concept/lilac/toxicity/sbert.pkl filter=lfs diff=lfs merge=lfs -text
|
19 |
-
data/datasets/lilac/piqa/data-00000-of-00001.parquet filter=lfs diff=lfs merge=lfs -text
|
20 |
-
data/datasets/lilac/piqa/goal/gte-small/hnsw.hnswlib.bin filter=lfs diff=lfs merge=lfs -text
|
21 |
-
data/datasets/lilac/piqa/goal/gte-small/hnsw.lookup.pkl filter=lfs diff=lfs merge=lfs -text
|
22 |
-
data/datasets/lilac/piqa/goal/gte-small/spans.pkl filter=lfs diff=lfs merge=lfs -text
|
23 |
-
data/datasets/lilac/piqa/sol1/gte-small/hnsw.hnswlib.bin filter=lfs diff=lfs merge=lfs -text
|
24 |
-
data/datasets/lilac/piqa/sol1/gte-small/hnsw.lookup.pkl filter=lfs diff=lfs merge=lfs -text
|
25 |
-
data/datasets/lilac/piqa/sol1/gte-small/spans.pkl filter=lfs diff=lfs merge=lfs -text
|
26 |
-
data/datasets/lilac/piqa/sol2/gte-small/hnsw.hnswlib.bin filter=lfs diff=lfs merge=lfs -text
|
27 |
-
data/datasets/lilac/piqa/sol2/gte-small/hnsw.lookup.pkl filter=lfs diff=lfs merge=lfs -text
|
28 |
-
data/datasets/lilac/piqa/sol2/gte-small/spans.pkl filter=lfs diff=lfs merge=lfs -text
|
29 |
-
data/datasets/lilac/enron-emails/data-00000-of-00001.parquet filter=lfs diff=lfs merge=lfs -text
|
30 |
-
data/datasets/lilac/enron-emails/text/gte-small/hnsw.hnswlib.bin filter=lfs diff=lfs merge=lfs -text
|
31 |
-
data/datasets/lilac/enron-emails/text/gte-small/hnsw.lookup.pkl filter=lfs diff=lfs merge=lfs -text
|
32 |
-
data/datasets/lilac/enron-emails/text/gte-small/spans.pkl filter=lfs diff=lfs merge=lfs -text
|
33 |
-
data/datasets/lilac/enron-emails/text/lang_detection/data-00000-of-00001.parquet filter=lfs diff=lfs merge=lfs -text
|
34 |
-
data/datasets/lilac/enron-emails/text/near_dup/data-00000-of-00001.parquet filter=lfs diff=lfs merge=lfs -text
|
35 |
-
data/datasets/lilac/enron-emails/text/pii/data-00000-of-00001.parquet filter=lfs diff=lfs merge=lfs -text
|
36 |
-
data/datasets/lilac/mmlu_professional_law/choices/gte-small/hnsw.hnswlib.bin filter=lfs diff=lfs merge=lfs -text
|
37 |
-
data/datasets/lilac/mmlu_professional_law/choices/gte-small/hnsw.lookup.pkl filter=lfs diff=lfs merge=lfs -text
|
38 |
-
data/datasets/lilac/mmlu_professional_law/choices/gte-small/spans.pkl filter=lfs diff=lfs merge=lfs -text
|
39 |
-
data/datasets/lilac/mmlu_professional_law/choices/lang_detection/data-00000-of-00001.parquet filter=lfs diff=lfs merge=lfs -text
|
40 |
-
data/datasets/lilac/mmlu_professional_law/choices/near_dup/data-00000-of-00001.parquet filter=lfs diff=lfs merge=lfs -text
|
41 |
-
data/datasets/lilac/mmlu_professional_law/choices/pii/data-00000-of-00001.parquet filter=lfs diff=lfs merge=lfs -text
|
42 |
-
data/datasets/lilac/mmlu_professional_law/choices/text_statistics/data-00000-of-00001.parquet filter=lfs diff=lfs merge=lfs -text
|
43 |
-
data/datasets/lilac/mmlu_professional_law/data-00000-of-00001.parquet filter=lfs diff=lfs merge=lfs -text
|
44 |
-
data/datasets/lilac/mmlu_professional_law/question/gte-small/hnsw.hnswlib.bin filter=lfs diff=lfs merge=lfs -text
|
45 |
-
data/datasets/lilac/mmlu_professional_law/question/gte-small/hnsw.lookup.pkl filter=lfs diff=lfs merge=lfs -text
|
46 |
-
data/datasets/lilac/mmlu_professional_law/question/gte-small/spans.pkl filter=lfs diff=lfs merge=lfs -text
|
47 |
-
data/datasets/lilac/mmlu_professional_law/question/lang_detection/data-00000-of-00001.parquet filter=lfs diff=lfs merge=lfs -text
|
48 |
-
data/datasets/lilac/mmlu_professional_law/question/near_dup/data-00000-of-00001.parquet filter=lfs diff=lfs merge=lfs -text
|
49 |
-
data/datasets/lilac/mmlu_professional_law/question/pii/data-00000-of-00001.parquet filter=lfs diff=lfs merge=lfs -text
|
50 |
-
data/datasets/lilac/mmlu_professional_law/question/text_statistics/data-00000-of-00001.parquet filter=lfs diff=lfs merge=lfs -text
|
51 |
-
data/datasets/lilac/pile-of-law-r-legaladvice/data-00000-of-00001.parquet filter=lfs diff=lfs merge=lfs -text
|
52 |
-
data/datasets/lilac/pile-of-law-r-legaladvice/text/gte-small/hnsw.hnswlib.bin filter=lfs diff=lfs merge=lfs -text
|
53 |
-
data/datasets/lilac/pile-of-law-r-legaladvice/text/gte-small/hnsw.lookup.pkl filter=lfs diff=lfs merge=lfs -text
|
54 |
-
data/datasets/lilac/pile-of-law-r-legaladvice/text/gte-small/spans.pkl filter=lfs diff=lfs merge=lfs -text
|
55 |
-
data/datasets/lilac/pile-of-law-r-legaladvice/text/lang_detection/data-00000-of-00001.parquet filter=lfs diff=lfs merge=lfs -text
|
56 |
-
data/datasets/lilac/pile-of-law-r-legaladvice/text/near_dup/data-00000-of-00001.parquet filter=lfs diff=lfs merge=lfs -text
|
57 |
-
data/datasets/lilac/pile-of-law-r-legaladvice/text/pii/data-00000-of-00001.parquet filter=lfs diff=lfs merge=lfs -text
|
58 |
-
data/datasets/lilac/pile-of-law-r-legaladvice/text/text_statistics/data-00000-of-00001.parquet filter=lfs diff=lfs merge=lfs -text
|
59 |
-
data/datasets/lilac/open-asssistant-conversations/data-00000-of-00001.parquet filter=lfs diff=lfs merge=lfs -text
|
60 |
-
data/datasets/lilac/open-asssistant-conversations/text/gte-small/hnsw.hnswlib.bin filter=lfs diff=lfs merge=lfs -text
|
61 |
-
data/datasets/lilac/open-asssistant-conversations/text/gte-small/hnsw.lookup.pkl filter=lfs diff=lfs merge=lfs -text
|
62 |
-
data/datasets/lilac/open-asssistant-conversations/text/gte-small/spans.pkl filter=lfs diff=lfs merge=lfs -text
|
63 |
-
data/datasets/lilac/open-asssistant-conversations/text/lang_detection/data-00000-of-00001.parquet filter=lfs diff=lfs merge=lfs -text
|
64 |
-
data/datasets/lilac/open-asssistant-conversations/text/near_dup/data-00000-of-00001.parquet filter=lfs diff=lfs merge=lfs -text
|
65 |
-
data/datasets/lilac/open-asssistant-conversations/text/pii/data-00000-of-00001.parquet filter=lfs diff=lfs merge=lfs -text
|
66 |
-
data/datasets/lilac/open-asssistant-conversations/text/text_statistics/data-00000-of-00001.parquet filter=lfs diff=lfs merge=lfs -text
|
67 |
-
data/datasets/lilac/squad_v2/answers/text/lang_detection/data-00000-of-00001.parquet filter=lfs diff=lfs merge=lfs -text
|
68 |
-
data/datasets/lilac/squad_v2/answers/text/near_dup/data-00000-of-00001.parquet filter=lfs diff=lfs merge=lfs -text
|
69 |
-
data/datasets/lilac/squad_v2/answers/text/pii/data-00000-of-00001.parquet filter=lfs diff=lfs merge=lfs -text
|
70 |
-
data/datasets/lilac/squad_v2/answers/text/text_statistics/data-00000-of-00001.parquet filter=lfs diff=lfs merge=lfs -text
|
71 |
-
data/datasets/lilac/squad_v2/context/gte-small/hnsw.hnswlib.bin filter=lfs diff=lfs merge=lfs -text
|
72 |
-
data/datasets/lilac/squad_v2/context/gte-small/hnsw.lookup.pkl filter=lfs diff=lfs merge=lfs -text
|
73 |
-
data/datasets/lilac/squad_v2/context/gte-small/spans.pkl filter=lfs diff=lfs merge=lfs -text
|
74 |
-
data/datasets/lilac/squad_v2/context/lang_detection/data-00000-of-00001.parquet filter=lfs diff=lfs merge=lfs -text
|
75 |
-
data/datasets/lilac/squad_v2/context/near_dup/data-00000-of-00001.parquet filter=lfs diff=lfs merge=lfs -text
|
76 |
-
data/datasets/lilac/squad_v2/context/pii/data-00000-of-00001.parquet filter=lfs diff=lfs merge=lfs -text
|
77 |
-
data/datasets/lilac/squad_v2/context/text_statistics/data-00000-of-00001.parquet filter=lfs diff=lfs merge=lfs -text
|
78 |
-
data/datasets/lilac/squad_v2/data-00000-of-00001.parquet filter=lfs diff=lfs merge=lfs -text
|
79 |
-
data/datasets/lilac/squad_v2/question/lang_detection/data-00000-of-00001.parquet filter=lfs diff=lfs merge=lfs -text
|
80 |
-
data/datasets/lilac/squad_v2/question/near_dup/data-00000-of-00001.parquet filter=lfs diff=lfs merge=lfs -text
|
81 |
-
data/datasets/lilac/squad_v2/question/pii/data-00000-of-00001.parquet filter=lfs diff=lfs merge=lfs -text
|
82 |
-
data/datasets/lilac/squad_v2/question/text_statistics/data-00000-of-00001.parquet filter=lfs diff=lfs merge=lfs -text
|
83 |
-
data/datasets/lilac/imdb/data-00000-of-00001.parquet filter=lfs diff=lfs merge=lfs -text
|
84 |
-
data/datasets/lilac/imdb/text/gte-small/hnsw.hnswlib.bin filter=lfs diff=lfs merge=lfs -text
|
85 |
-
data/datasets/lilac/imdb/text/gte-small/hnsw.lookup.pkl filter=lfs diff=lfs merge=lfs -text
|
86 |
-
data/datasets/lilac/imdb/text/gte-small/spans.pkl filter=lfs diff=lfs merge=lfs -text
|
87 |
-
data/datasets/lilac/imdb/text/lang_detection/data-00000-of-00001.parquet filter=lfs diff=lfs merge=lfs -text
|
88 |
-
data/datasets/lilac/imdb/text/near_dup/data-00000-of-00001.parquet filter=lfs diff=lfs merge=lfs -text
|
89 |
-
data/datasets/lilac/imdb/text/pii/data-00000-of-00001.parquet filter=lfs diff=lfs merge=lfs -text
|
90 |
-
data/datasets/lilac/imdb/text/text_statistics/data-00000-of-00001.parquet filter=lfs diff=lfs merge=lfs -text
|
91 |
-
data/datasets/lilac/databricks-dolly-15k-curated-en/data-00000-of-00001.parquet filter=lfs diff=lfs merge=lfs -text
|
92 |
-
data/datasets/lilac/databricks-dolly-15k-curated-en/new-context/value/gte-small/hnsw.hnswlib.bin filter=lfs diff=lfs merge=lfs -text
|
93 |
-
data/datasets/lilac/databricks-dolly-15k-curated-en/original-context/gte-small/hnsw.hnswlib.bin filter=lfs diff=lfs merge=lfs -text
|
94 |
-
data/datasets/lilac/OpenOrca-100k/data-00000-of-00001.parquet filter=lfs diff=lfs merge=lfs -text
|
95 |
-
data/datasets/lilac/OpenOrca-100k/question/gte-small/hnsw.hnswlib.bin filter=lfs diff=lfs merge=lfs -text
|
96 |
-
data/datasets/lilac/OpenOrca-100k/question/gte-small/hnsw.lookup.pkl filter=lfs diff=lfs merge=lfs -text
|
97 |
-
data/datasets/lilac/OpenOrca-100k/question/gte-small/spans.pkl filter=lfs diff=lfs merge=lfs -text
|
98 |
-
data/datasets/lilac/OpenOrca-100k/question/lang_detection/data-00000-of-00001.parquet filter=lfs diff=lfs merge=lfs -text
|
99 |
-
data/datasets/lilac/OpenOrca-100k/question/near_dup/data-00000-of-00001.parquet filter=lfs diff=lfs merge=lfs -text
|
100 |
-
data/datasets/lilac/OpenOrca-100k/question/pii/data-00000-of-00001.parquet filter=lfs diff=lfs merge=lfs -text
|
101 |
-
data/datasets/lilac/OpenOrca-100k/question/text_statistics/data-00000-of-00001.parquet filter=lfs diff=lfs merge=lfs -text
|
102 |
-
data/datasets/lilac/OpenOrca-100k/response/gte-small/hnsw.hnswlib.bin filter=lfs diff=lfs merge=lfs -text
|
103 |
-
data/datasets/lilac/OpenOrca-100k/response/gte-small/hnsw.lookup.pkl filter=lfs diff=lfs merge=lfs -text
|
104 |
-
data/datasets/lilac/OpenOrca-100k/response/gte-small/spans.pkl filter=lfs diff=lfs merge=lfs -text
|
105 |
-
data/datasets/lilac/OpenOrca-100k/response/lang_detection/data-00000-of-00001.parquet filter=lfs diff=lfs merge=lfs -text
|
106 |
-
data/datasets/lilac/OpenOrca-100k/response/near_dup/data-00000-of-00001.parquet filter=lfs diff=lfs merge=lfs -text
|
107 |
-
data/datasets/lilac/OpenOrca-100k/response/pii/data-00000-of-00001.parquet filter=lfs diff=lfs merge=lfs -text
|
108 |
-
data/datasets/lilac/OpenOrca-100k/response/text_statistics/data-00000-of-00001.parquet filter=lfs diff=lfs merge=lfs -text
|
109 |
-
data/datasets/lilac/wikitext-2-raw-v1/data-00000-of-00001.parquet filter=lfs diff=lfs merge=lfs -text
|
110 |
-
data/datasets/lilac/wikitext-2-raw-v1/text/gte-small/hnsw.hnswlib.bin filter=lfs diff=lfs merge=lfs -text
|
111 |
-
data/datasets/lilac/wikitext-2-raw-v1/text/gte-small/hnsw.lookup.pkl filter=lfs diff=lfs merge=lfs -text
|
112 |
-
data/datasets/lilac/wikitext-2-raw-v1/text/gte-small/spans.pkl filter=lfs diff=lfs merge=lfs -text
|
113 |
-
data/datasets/lilac/wikitext-2-raw-v1/text/lang_detection/data-00000-of-00001.parquet filter=lfs diff=lfs merge=lfs -text
|
114 |
-
data/datasets/lilac/wikitext-2-raw-v1/text/near_dup/data-00000-of-00001.parquet filter=lfs diff=lfs merge=lfs -text
|
115 |
-
data/datasets/lilac/wikitext-2-raw-v1/text/pii/data-00000-of-00001.parquet filter=lfs diff=lfs merge=lfs -text
|
116 |
-
data/datasets/lilac/wikitext-2-raw-v1/text/text_statistics/data-00000-of-00001.parquet filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
data/.cache/lilac/concept/lilac/legal-termination/cohere.pkl
DELETED
Binary file (610 kB)
|
|
data/.cache/lilac/concept/lilac/legal-termination/gte-base.pkl
DELETED
Binary file (117 kB)
|
|
data/.cache/lilac/concept/lilac/legal-termination/gte-small.pkl
DELETED
Binary file (60.6 kB)
|
|
data/.cache/lilac/concept/lilac/legal-termination/openai.pkl
DELETED
Binary file (231 kB)
|
|
data/.cache/lilac/concept/lilac/legal-termination/palm.pkl
DELETED
Binary file (117 kB)
|
|
data/.cache/lilac/concept/lilac/legal-termination/sbert.pkl
DELETED
Binary file (60.6 kB)
|
|
data/.cache/lilac/concept/lilac/negative-sentiment/cohere.pkl
DELETED
@@ -1,3 +0,0 @@
|
|
1 |
-
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:be0a6613703986f991d3795a6b3cfdccd40b75ce1c6cbf36e852403c8d8a6b7b
|
3 |
-
size 2088021
|
|
|
|
|
|
|
|
data/.cache/lilac/concept/lilac/negative-sentiment/gte-base.pkl
DELETED
Binary file (397 kB)
|
|
data/.cache/lilac/concept/lilac/negative-sentiment/gte-small.pkl
DELETED
Binary file (202 kB)
|
|
data/.cache/lilac/concept/lilac/negative-sentiment/openai.pkl
DELETED
Binary file (787 kB)
|
|
data/.cache/lilac/concept/lilac/negative-sentiment/palm.pkl
DELETED
Binary file (397 kB)
|
|
data/.cache/lilac/concept/lilac/negative-sentiment/sbert.pkl
DELETED
Binary file (202 kB)
|
|
data/.cache/lilac/concept/lilac/positive-sentiment/cohere.pkl
DELETED
@@ -1,3 +0,0 @@
|
|
1 |
-
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:d654cd9eb459aba5509d6b21d48e2f2560c84457608a0ddefc0d7e26a685b7ef
|
3 |
-
size 1857652
|
|
|
|
|
|
|
|
data/.cache/lilac/concept/lilac/positive-sentiment/gte-base.pkl
DELETED
Binary file (353 kB)
|
|
data/.cache/lilac/concept/lilac/positive-sentiment/gte-small.pkl
DELETED
Binary file (180 kB)
|
|
data/.cache/lilac/concept/lilac/positive-sentiment/openai.pkl
DELETED
Binary file (700 kB)
|
|
data/.cache/lilac/concept/lilac/positive-sentiment/palm.pkl
DELETED
Binary file (353 kB)
|
|
data/.cache/lilac/concept/lilac/positive-sentiment/sbert.pkl
DELETED
Binary file (180 kB)
|
|
data/.cache/lilac/concept/lilac/profanity/cohere.pkl
DELETED
@@ -1,3 +0,0 @@
|
|
1 |
-
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:0d68aeb0d88c4a501e21173ed3e5e53fa4998447ece6812d046c1c48b2595739
|
3 |
-
size 17413997
|
|
|
|
|
|
|
|
data/.cache/lilac/concept/lilac/profanity/gte-base.pkl
DELETED
@@ -1,3 +0,0 @@
|
|
1 |
-
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:20c4454090ac980db7f02e5f2ff974b0fe75e26982c40e323891fae4b3785d38
|
3 |
-
size 3301326
|
|
|
|
|
|
|
|
data/.cache/lilac/concept/lilac/profanity/gte-small.pkl
DELETED
@@ -1,3 +0,0 @@
|
|
1 |
-
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:ef20b176c6faec04280e7f4fcc5edfd01c8261b4838eab2955885a171e46590d
|
3 |
-
size 1672960
|
|
|
|
|
|
|
|
data/.cache/lilac/concept/lilac/profanity/openai.pkl
DELETED
@@ -1,3 +0,0 @@
|
|
1 |
-
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:6a8e4c306cbbdbfa1d5dde1504fa67ee8e5ffa02ab77f1e8d06d15b9ea777398
|
3 |
-
size 6558076
|
|
|
|
|
|
|
|
data/.cache/lilac/concept/lilac/profanity/palm.pkl
DELETED
@@ -1,3 +0,0 @@
|
|
1 |
-
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:0450ba56a6af797838a696e5d1046e84dbca2d6c6a00724c3bf403465980b1f5
|
3 |
-
size 3301322
|
|
|
|
|
|
|
|
data/.cache/lilac/concept/lilac/profanity/sbert.pkl
DELETED
@@ -1,3 +0,0 @@
|
|
1 |
-
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:44f41da69be02fb8ffe4db5d7d16cdd0e8f4357f8147d4259ae5518863577087
|
3 |
-
size 1672951
|
|
|
|
|
|
|
|
data/.cache/lilac/concept/lilac/question/cohere.pkl
DELETED
@@ -1,3 +0,0 @@
|
|
1 |
-
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:f933671c53af61a862ced9596326f52898f4ed827b917b66bca79d277ac8fc26
|
3 |
-
size 6254200
|
|
|
|
|
|
|
|
data/.cache/lilac/concept/lilac/question/gte-base.pkl
DELETED
@@ -1,3 +0,0 @@
|
|
1 |
-
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:aca30e4e5781f3c41b1390d7957ade2e0ab8ba7fa7c0ab86a6adada968ff0875
|
3 |
-
size 1194951
|
|
|
|
|
|
|
|
data/.cache/lilac/concept/lilac/question/gte-small.pkl
DELETED
Binary file (611 kB)
|
|
data/.cache/lilac/concept/lilac/question/openai.pkl
DELETED
@@ -1,3 +0,0 @@
|
|
1 |
-
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:f22a5242b5e77afc904217cc659e28e8aabf4faacfe68c32ca8a1b64779c5359
|
3 |
-
size 2362458
|
|
|
|
|
|
|
|
data/.cache/lilac/concept/lilac/question/palm.pkl
DELETED
@@ -1,3 +0,0 @@
|
|
1 |
-
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:54afeddb816e97f3d5dbcf86c5603826ac34ca7bf585e33ad369a7d5e3edd45a
|
3 |
-
size 1194947
|
|
|
|
|
|
|
|
data/.cache/lilac/concept/lilac/question/sbert.pkl
DELETED
Binary file (611 kB)
|
|
data/.cache/lilac/concept/lilac/source-code/cohere.pkl
DELETED
Binary file (610 kB)
|
|
data/.cache/lilac/concept/lilac/source-code/gte-base.pkl
DELETED
Binary file (117 kB)
|
|
data/.cache/lilac/concept/lilac/source-code/gte-small.pkl
DELETED
Binary file (60.6 kB)
|
|
data/.cache/lilac/concept/lilac/source-code/openai.pkl
DELETED
Binary file (231 kB)
|
|
data/.cache/lilac/concept/lilac/source-code/palm.pkl
DELETED
Binary file (117 kB)
|
|
data/.cache/lilac/concept/lilac/source-code/sbert.pkl
DELETED
Binary file (60.6 kB)
|
|
data/.cache/lilac/concept/lilac/toxicity/cohere.pkl
DELETED
@@ -1,3 +0,0 @@
|
|
1 |
-
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:8ec3b151a149f0664813f50ba599001bc3a44cc7b6f8c35a48e213ee9c9682fb
|
3 |
-
size 19602537
|
|
|
|
|
|
|
|
data/.cache/lilac/concept/lilac/toxicity/gte-base.pkl
DELETED
@@ -1,3 +0,0 @@
|
|
1 |
-
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:bd428cfda7f66401cf3b6ec9f1b356c3e0d79ab5bce8675c271e562c24de3580
|
3 |
-
size 3719127
|
|
|
|
|
|
|
|
data/.cache/lilac/concept/lilac/toxicity/gte-small.pkl
DELETED
@@ -1,3 +0,0 @@
|
|
1 |
-
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:b9bab578121263c97f51049e82846b7b517b79655bfd9b6ad5fe861dbefd1212
|
3 |
-
size 1886446
|
|
|
|
|
|
|
|
data/.cache/lilac/concept/lilac/toxicity/openai.pkl
DELETED
@@ -1,3 +0,0 @@
|
|
1 |
-
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:4e9be59c226a117c78c32cdb0f4befaf771b74a7af820af25f86053e1cf80614
|
3 |
-
size 7384512
|
|
|
|
|
|
|
|
data/.cache/lilac/concept/lilac/toxicity/palm.pkl
DELETED
@@ -1,3 +0,0 @@
|
|
1 |
-
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:b334cd21b80823eb0b7a6c177ba2f6ed8cadc504b642e7b89481f0e583dcfece
|
3 |
-
size 3719128
|
|
|
|
|
|
|
|
data/.cache/lilac/concept/lilac/toxicity/sbert.pkl
DELETED
@@ -1,3 +0,0 @@
|
|
1 |
-
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:64540327c019de743fa40b494f21cf1a5a7b0af80df6243eb44b56cf3810ccbf
|
3 |
-
size 1886440
|
|
|
|
|
|
|
|
data/datasets/lilac/OpenOrca-100k/config.yml
DELETED
@@ -1,28 +0,0 @@
|
|
1 |
-
embeddings:
|
2 |
-
- {embedding: gte-small, path: response}
|
3 |
-
- {embedding: gte-small, path: question}
|
4 |
-
name: OpenOrca-100k
|
5 |
-
namespace: local
|
6 |
-
settings:
|
7 |
-
preferred_embedding: gte-small
|
8 |
-
ui:
|
9 |
-
media_paths: [question, response]
|
10 |
-
signals:
|
11 |
-
- path: question
|
12 |
-
signal: {signal_name: near_dup}
|
13 |
-
- path: question
|
14 |
-
signal: {signal_name: text_statistics}
|
15 |
-
- path: question
|
16 |
-
signal: {signal_name: pii}
|
17 |
-
- path: question
|
18 |
-
signal: {signal_name: lang_detection}
|
19 |
-
- path: response
|
20 |
-
signal: {signal_name: near_dup}
|
21 |
-
- path: response
|
22 |
-
signal: {signal_name: text_statistics}
|
23 |
-
- path: response
|
24 |
-
signal: {signal_name: pii}
|
25 |
-
- path: response
|
26 |
-
signal: {signal_name: lang_detection}
|
27 |
-
source: {dataset_name: Open-Orca/OpenOrca, sample_size: 100000, source_name: huggingface}
|
28 |
-
tags: [machine-learning]
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
data/datasets/lilac/OpenOrca-100k/data-00000-of-00001.parquet
DELETED
@@ -1,3 +0,0 @@
|
|
1 |
-
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:f95588367446af55ccc2f089092779670c57308ee1f72a849e41f22e126d5052
|
3 |
-
size 105147761
|
|
|
|
|
|
|
|
data/datasets/lilac/OpenOrca-100k/manifest.json
DELETED
@@ -1,24 +0,0 @@
|
|
1 |
-
{
|
2 |
-
"files": [
|
3 |
-
"data-00000-of-00001.parquet"
|
4 |
-
],
|
5 |
-
"data_schema": {
|
6 |
-
"fields": {
|
7 |
-
"id": {
|
8 |
-
"dtype": "string"
|
9 |
-
},
|
10 |
-
"system_prompt": {
|
11 |
-
"dtype": "string"
|
12 |
-
},
|
13 |
-
"question": {
|
14 |
-
"dtype": "string"
|
15 |
-
},
|
16 |
-
"response": {
|
17 |
-
"dtype": "string"
|
18 |
-
},
|
19 |
-
"__hfsplit__": {
|
20 |
-
"dtype": "string"
|
21 |
-
}
|
22 |
-
}
|
23 |
-
}
|
24 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
data/datasets/lilac/OpenOrca-100k/question/gte-small/hnsw.hnswlib.bin
DELETED
@@ -1,3 +0,0 @@
|
|
1 |
-
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:5dfe25276925e77c354a88ae5a6f19bcfc4f9b5e8b040848ae0769d05c9609d7
|
3 |
-
size 596705084
|
|
|
|
|
|
|
|
data/datasets/lilac/OpenOrca-100k/question/gte-small/hnsw.lookup.pkl
DELETED
@@ -1,3 +0,0 @@
|
|
1 |
-
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:3c0bac1790aa5247eb288c2a828a92eb313090b36a015665f6aae42e5a4dcb18
|
3 |
-
size 9378299
|
|
|
|
|
|
|
|
data/datasets/lilac/OpenOrca-100k/question/gte-small/signal_manifest.json
DELETED
@@ -1,32 +0,0 @@
|
|
1 |
-
{
|
2 |
-
"files": [],
|
3 |
-
"parquet_id": "question.gte-small",
|
4 |
-
"data_schema": {
|
5 |
-
"fields": {
|
6 |
-
"question": {
|
7 |
-
"fields": {
|
8 |
-
"gte-small": {
|
9 |
-
"repeated_field": {
|
10 |
-
"fields": {
|
11 |
-
"embedding": {
|
12 |
-
"dtype": "embedding"
|
13 |
-
}
|
14 |
-
},
|
15 |
-
"dtype": "string_span"
|
16 |
-
},
|
17 |
-
"signal": {
|
18 |
-
"signal_name": "gte-small"
|
19 |
-
}
|
20 |
-
}
|
21 |
-
}
|
22 |
-
}
|
23 |
-
}
|
24 |
-
},
|
25 |
-
"signal": {
|
26 |
-
"signal_name": "gte-small"
|
27 |
-
},
|
28 |
-
"enriched_path": [
|
29 |
-
"question"
|
30 |
-
],
|
31 |
-
"vector_store": "hnsw"
|
32 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|