67
Browse files
app/data/shakespeare_char/prepare.py
CHANGED
@@ -46,16 +46,17 @@ print(f"train has {len(train_ids):,} tokens")
|
|
46 |
print(f"val has {len(val_ids):,} tokens")
|
47 |
|
48 |
# export to bin files
|
49 |
-
permissions = 0o755
|
50 |
train_ids = np.array(train_ids, dtype=np.uint16)
|
51 |
val_ids = np.array(val_ids, dtype=np.uint16)
|
52 |
-
|
53 |
-
|
54 |
-
|
55 |
-
|
56 |
-
|
57 |
-
|
58 |
-
|
|
|
|
|
59 |
|
60 |
# save the meta information as well, to help us encode/decode later
|
61 |
meta = {
|
|
|
46 |
print(f"val has {len(val_ids):,} tokens")
|
47 |
|
48 |
# export to bin files
|
|
|
49 |
train_ids = np.array(train_ids, dtype=np.uint16)
|
50 |
val_ids = np.array(val_ids, dtype=np.uint16)
|
51 |
+
|
52 |
+
# Destination paths for the encoded splits, next to this script.
file_path_train = os.path.join(os.path.dirname(__file__), 'train.bin')
file_path_val = os.path.join(os.path.dirname(__file__), 'val.bin')
permissions = 0o755

# Write the files first: os.chmod raises FileNotFoundError when the target
# does not exist, which is the case on a fresh checkout before the first
# export has ever run.
train_ids.tofile(file_path_train)
val_ids.tofile(file_path_val)

# Apply the requested mode only once both files are on disk.
os.chmod(file_path_train, permissions)
os.chmod(file_path_val, permissions)
|
60 |
|
61 |
# save the meta information as well, to help us encode/decode later
|
62 |
meta = {
|