Upload folder using huggingface_hub
Browse files
.gitattributes
CHANGED
@@ -12,3 +12,4 @@ data/datasets/lilac/piqa/sol1/gte-small/spans.pkl filter=lfs diff=lfs merge=lfs
|
|
12 |
data/datasets/lilac/piqa/sol2/gte-small/hnsw.hnswlib.bin filter=lfs diff=lfs merge=lfs -text
|
13 |
data/datasets/lilac/piqa/sol2/gte-small/hnsw.lookup.pkl filter=lfs diff=lfs merge=lfs -text
|
14 |
data/datasets/lilac/piqa/sol2/gte-small/spans.pkl filter=lfs diff=lfs merge=lfs -text
|
|
|
|
12 |
data/datasets/lilac/piqa/sol2/gte-small/hnsw.hnswlib.bin filter=lfs diff=lfs merge=lfs -text
|
13 |
data/datasets/lilac/piqa/sol2/gte-small/hnsw.lookup.pkl filter=lfs diff=lfs merge=lfs -text
|
14 |
data/datasets/lilac/piqa/sol2/gte-small/spans.pkl filter=lfs diff=lfs merge=lfs -text
|
15 |
+
data/datasets/lilac/pile-of-law-atticus-contracts/data-00000-of-00001.parquet filter=lfs diff=lfs merge=lfs -text
|
data/datasets/lilac/pile-of-law-atticus-contracts/config.yml
ADDED
@@ -0,0 +1,14 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
name: pile-of-law-atticus-contracts
|
2 |
+
namespace: lilac
|
3 |
+
settings:
|
4 |
+
preferred_embedding: gte-small
|
5 |
+
ui:
|
6 |
+
media_paths:
|
7 |
+
- text
|
8 |
+
source:
|
9 |
+
config_name: atticus_contracts
|
10 |
+
dataset_name: pile-of-law/pile-of-law
|
11 |
+
sample_size: 100000
|
12 |
+
source_name: huggingface
|
13 |
+
tags:
|
14 |
+
- legal
|
data/datasets/lilac/pile-of-law-atticus-contracts/data-00000-of-00001.parquet
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:654fd626e1d336406da59fd0efe676c91e58c3752fa0bf668523df6872d2b131
|
3 |
+
size 4778681829
|
data/datasets/lilac/pile-of-law-atticus-contracts/manifest.json
ADDED
@@ -0,0 +1,27 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"files": [
|
3 |
+
"data-00000-of-00001.parquet"
|
4 |
+
],
|
5 |
+
"data_schema": {
|
6 |
+
"fields": {
|
7 |
+
"text": {
|
8 |
+
"dtype": "string"
|
9 |
+
},
|
10 |
+
"created_timestamp": {
|
11 |
+
"dtype": "string"
|
12 |
+
},
|
13 |
+
"downloaded_timestamp": {
|
14 |
+
"dtype": "string"
|
15 |
+
},
|
16 |
+
"url": {
|
17 |
+
"dtype": "string"
|
18 |
+
},
|
19 |
+
"__hfsplit__": {
|
20 |
+
"dtype": "string"
|
21 |
+
},
|
22 |
+
"__rowid__": {
|
23 |
+
"dtype": "string"
|
24 |
+
}
|
25 |
+
}
|
26 |
+
}
|
27 |
+
}
|