krish-emissary committed on
Commit
874b6ca
·
verified ·
1 Parent(s): b6f2cad

Add files using upload-large-folder tool

Browse files
Files changed (20) hide show
  1. emissary-ml/llm-scripts/fine-tuning/llama3/gpu_monitoring.py +134 -0
  2. emissary-ml/llm-scripts/fine-tuning/llama3/test_script.py +1 -0
  3. emissary-ml/llm-scripts/fine-tuning/llama3/venv/share/jupyter/labextensions/@jupyter-notebook/lab-extension/package.json +109 -0
  4. emissary-ml/llm-scripts/fine-tuning/llama3/venv/share/jupyter/labextensions/@jupyter-notebook/lab-extension/static/style.js +4 -0
  5. emissary-ml/llm-scripts/fine-tuning/llama3/venv/share/jupyter/labextensions/jupyterlab_pygments/package.json +205 -0
  6. emissary-ml/llm-scripts/fine-tuning/llama3/venv/share/jupyter/nbconvert/templates/base/cell_id_anchor.j2 +5 -0
  7. emissary-ml/llm-scripts/fine-tuning/llama3/venv/share/jupyter/nbconvert/templates/base/display_priority.j2 +49 -0
  8. emissary-ml/llm-scripts/fine-tuning/llama3/venv/share/jupyter/nbconvert/templates/base/null.j2 +111 -0
  9. emissary-ml/llm-scripts/fine-tuning/llama3/venv/share/jupyter/nbconvert/templates/reveal/index.html.j2 +194 -0
  10. emissary-ml/llm-scripts/fine-tuning/llama3/venv/share/jupyter/nbconvert/templates/reveal/static/custom_reveal.css +121 -0
  11. emissary-ml/llm-scripts/fine-tuning/llama3/venv/share/jupyter/nbconvert/templates/rst/conf.json +6 -0
  12. emissary-ml/llm-scripts/fine-tuning/llama3/venv/share/jupyter/nbconvert/templates/rst/index.rst.j2 +117 -0
  13. emissary-ml/llm-scripts/fine-tuning/llama3/wandb/debug.log +34 -0
  14. emissary-ml/llm-scripts/fine-tuning/llama3/wandb/run-20250811_231120-bt4spvmx/files/wandb-metadata.json +741 -0
  15. emissary-ml/llm-scripts/fine-tuning/llama3/wandb/run-20250811_231120-bt4spvmx/files/wandb-summary.json +1 -0
  16. emissary-ml/llm-scripts/fine-tuning/llama3/wandb/run-20250811_231120-bt4spvmx/logs/debug.log +34 -0
  17. emissary-ml/llm-scripts/fine-tuning/llama3/wandb/run-20250811_233312-jyfpuk9c/run-jyfpuk9c.wandb +0 -0
  18. emissary-ml/llm-scripts/fine-tuning/llama3/wandb/run-20250811_233648-eg3v9sv7/files/config.yaml +46 -0
  19. emissary-ml/llm-scripts/fine-tuning/llama3/wandb/run-20250811_233648-eg3v9sv7/files/wandb-summary.json +1 -0
  20. emissary-ml/llm-scripts/fine-tuning/llama3/wandb/run-20250811_233648-eg3v9sv7/logs/debug-internal.log +184 -0
emissary-ml/llm-scripts/fine-tuning/llama3/gpu_monitoring.py ADDED
@@ -0,0 +1,134 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ #!/usr/bin/env python3
2
+ """
3
+ GPU Memory Monitoring Script for Model Parallelization Experiments
4
+ """
5
+
6
+ import subprocess
7
+ import time
8
+ import csv
9
+ import datetime
10
+ import argparse
11
+
12
+
13
def get_gpu_memory_info():
    """Get current GPU memory usage using nvidia-smi.

    Runs ``nvidia-smi`` with a CSV query for index, name, used memory,
    total memory and GPU utilization, then parses one row per GPU.

    Rows are parsed independently: blank lines are ignored, and a row whose
    numeric fields cannot be converted (for example ``[N/A]``) is skipped
    with a printed warning instead of discarding the readings of every
    other GPU.

    Returns:
        A list with one dict per successfully parsed GPU. Each dict has the
        keys ``index``, ``name``, ``memory_used_mb``, ``memory_total_mb``
        and ``gpu_utilization``; every value except ``name`` is an int.
        An empty list is returned when nvidia-smi cannot be executed or
        exits with a non-zero status.
    """
    try:
        result = subprocess.run(
            ['nvidia-smi', '--query-gpu=index,name,memory.used,memory.total,utilization.gpu',
             '--format=csv,noheader,nounits'],
            capture_output=True, text=True, check=True
        )
    except (OSError, subprocess.SubprocessError, UnicodeError) as e:
        # Missing binary, non-zero exit status or undecodable output:
        # monitoring is best-effort, so report the problem and carry on.
        print(f"Error getting GPU info: {e}")
        return []

    gpu_info = []
    for line in result.stdout.splitlines():
        if not line.strip():
            continue
        parts = [part.strip() for part in line.split(',')]
        try:
            if len(parts) < 5:
                raise ValueError(f"expected 5 fields, got {len(parts)}")
            gpu_info.append({
                'index': int(parts[0]),
                # The name is the only free-text column; re-join it in case
                # it contains a comma itself.
                'name': ', '.join(parts[1:-3]),
                'memory_used_mb': int(parts[-3]),
                'memory_total_mb': int(parts[-2]),
                'gpu_utilization': int(parts[-1])
            })
        except ValueError as e:
            print(f"Skipping unparseable nvidia-smi line {line!r}: {e}")
    return gpu_info
36
+
37
def monitor_gpus(output_file, interval=5, experiment_name=""):
    """Poll GPU statistics in a loop and record every sample in a CSV file.

    The output file is opened for writing (replacing any existing content)
    and a header row is written. Each cycle then takes one timestamp,
    queries all GPUs via get_gpu_memory_info(), writes one CSV row per GPU,
    echoes the same figures to stdout, flushes the file and sleeps.
    The loop runs until the user presses Ctrl+C.

    Args:
        output_file: Path of the CSV file to write.
        interval: Seconds to sleep between polling cycles.
        experiment_name: Label stored in the ``experiment`` column of
            every row.
    """
    columns = ['timestamp', 'experiment', 'gpu_index', 'gpu_name',
               'memory_used_mb', 'memory_total_mb', 'memory_percent',
               'gpu_utilization']

    with open(output_file, 'w', newline='') as csvfile:
        log = csv.DictWriter(csvfile, fieldnames=columns)
        log.writeheader()

        print(f"Starting GPU monitoring for experiment: {experiment_name}")
        print(f"Writing to: {output_file}")
        print("Press Ctrl+C to stop monitoring\n")

        try:
            while True:
                # One timestamp per cycle so all GPUs of a sample share it.
                now = datetime.datetime.now().isoformat()

                for stats in get_gpu_memory_info():
                    used = stats['memory_used_mb']
                    total = stats['memory_total_mb']
                    util = stats['gpu_utilization']
                    pct = (used / total) * 100

                    log.writerow({
                        'timestamp': now,
                        'experiment': experiment_name,
                        'gpu_index': stats['index'],
                        'gpu_name': stats['name'],
                        'memory_used_mb': used,
                        'memory_total_mb': total,
                        'memory_percent': f"{pct:.2f}",
                        'gpu_utilization': util
                    })

                    print(f"GPU {stats['index']}: {used}/{total} MB "
                          f"({pct:.1f}%) | Util: {util}%")

                print("-" * 80)
                # Flush every cycle so the log is usable while still running.
                csvfile.flush()
                time.sleep(interval)

        except KeyboardInterrupt:
            print("\nMonitoring stopped.")
79
+
80
def analyze_log(log_file):
    """Analyze the monitoring log and print per-GPU summary statistics.

    Reads a CSV file containing the columns ``gpu_index``, ``gpu_name``,
    ``memory_used_mb``, ``memory_total_mb``, ``memory_percent`` and
    ``gpu_utilization``, groups the rows by GPU and prints the maximum and
    average memory usage and utilization for each GPU.

    GPU indices are converted to int so GPUs are reported in numeric order
    (2 before 10) rather than in string order.

    Args:
        log_file: Path to the CSV log to analyze.

    Raises:
        ValueError: If a numeric column holds a value that cannot be
            converted.
    """
    gpus = {}
    # newline='' is what the csv module expects for files handed to a reader.
    with open(log_file, 'r', newline='') as f:
        for row in csv.DictReader(f):
            row['gpu_index'] = int(row['gpu_index'])
            row['memory_used_mb'] = int(row['memory_used_mb'])
            row['memory_total_mb'] = int(row['memory_total_mb'])
            row['memory_percent'] = float(row['memory_percent'])
            row['gpu_utilization'] = int(row['gpu_utilization'])
            gpus.setdefault(row['gpu_index'], []).append(row)

    if not gpus:
        print("No data found in log file")
        return

    print(f"\nAnalysis of {log_file}:")
    print("=" * 80)

    # Keys are unique ints, so sorting never falls through to the row lists.
    for gpu_idx, gpu_data in sorted(gpus.items()):
        memory_used = [d['memory_used_mb'] for d in gpu_data]
        memory_percent = [d['memory_percent'] for d in gpu_data]
        gpu_util = [d['gpu_utilization'] for d in gpu_data]

        print(f"\nGPU {gpu_idx} ({gpu_data[0]['gpu_name']}):")
        print(f" Memory - Max: {max(memory_used)} MB ({max(memory_percent):.1f}%)")
        print(f" Memory - Avg: {sum(memory_used)/len(memory_used):.0f} MB ({sum(memory_percent)/len(memory_percent):.1f}%)")
        print(f" GPU Util - Max: {max(gpu_util)}%")
        print(f" GPU Util - Avg: {sum(gpu_util)/len(gpu_util):.1f}%")
117
+
118
if __name__ == "__main__":
    # Command-line entry point: with --analyze, summarize an existing log;
    # otherwise start live monitoring into the chosen output file.
    cli = argparse.ArgumentParser(
        description='GPU Memory Monitor for ML Experiments'
    )
    cli.add_argument(
        '--output', '-o',
        default='gpu_monitor.csv',
        help='Output CSV file',
    )
    cli.add_argument(
        '--interval', '-i',
        type=int,
        default=5,
        help='Monitoring interval in seconds',
    )
    cli.add_argument(
        '--experiment', '-e',
        default='',
        help='Experiment name/description',
    )
    cli.add_argument(
        '--analyze', '-a',
        help='Analyze existing log file instead of monitoring',
    )

    options = cli.parse_args()

    if not options.analyze:
        monitor_gpus(options.output, options.interval, options.experiment)
    else:
        analyze_log(options.analyze)
emissary-ml/llm-scripts/fine-tuning/llama3/test_script.py ADDED
@@ -0,0 +1 @@
 
 
1
# Module-level mapping named test_functions; it starts out empty.
test_functions = dict()
emissary-ml/llm-scripts/fine-tuning/llama3/venv/share/jupyter/labextensions/@jupyter-notebook/lab-extension/package.json ADDED
@@ -0,0 +1,109 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "name": "@jupyter-notebook/lab-extension",
3
+ "version": "7.4.2",
4
+ "description": "Jupyter Notebook - Lab Extension",
5
+ "homepage": "https://github.com/jupyter/notebook",
6
+ "bugs": {
7
+ "url": "https://github.com/jupyter/notebook/issues"
8
+ },
9
+ "repository": {
10
+ "type": "git",
11
+ "url": "https://github.com/jupyter/notebook.git"
12
+ },
13
+ "license": "BSD-3-Clause",
14
+ "author": "Project Jupyter",
15
+ "sideEffects": [
16
+ "style/**/*.css",
17
+ "style/index.js"
18
+ ],
19
+ "main": "lib/index.js",
20
+ "types": "lib/index.d.ts",
21
+ "style": "style/index.css",
22
+ "directories": {
23
+ "lib": "lib/"
24
+ },
25
+ "files": [
26
+ "lib/*.d.ts",
27
+ "lib/*.js.map",
28
+ "lib/*.js",
29
+ "schema/*.json",
30
+ "style/index.js"
31
+ ],
32
+ "scripts": {
33
+ "build": "jlpm run build:labextension:dev",
34
+ "build:labextension": "jupyter labextension build .",
35
+ "build:labextension:dev": "jupyter labextension build --development True .",
36
+ "build:lib": "tsc -b",
37
+ "build:prod": "jlpm run build:labextension",
38
+ "clean": "jlpm run clean:lib && jlpm run clean:labextension",
39
+ "clean:labextension": "rimraf ../../notebook/labextension",
40
+ "clean:lib": "rimraf lib tsconfig.tsbuildinfo",
41
+ "watch": "run-p watch:src watch:labextension",
42
+ "watch:labextension": "jupyter labextension watch .",
43
+ "watch:src": "tsc -w"
44
+ },
45
+ "dependencies": {
46
+ "@jupyter-notebook/application": "^7.4.2",
47
+ "@jupyterlab/application": "~4.4.2",
48
+ "@jupyterlab/apputils": "~4.5.2",
49
+ "@jupyterlab/coreutils": "~6.4.2",
50
+ "@jupyterlab/docregistry": "~4.4.2",
51
+ "@jupyterlab/notebook": "~4.4.2",
52
+ "@jupyterlab/translation": "~4.4.2",
53
+ "@jupyterlab/ui-components": "~4.4.2",
54
+ "@lumino/commands": "^2.3.2",
55
+ "@lumino/disposable": "^2.1.4"
56
+ },
57
+ "devDependencies": {
58
+ "@jupyterlab/builder": "~4.4.2",
59
+ "rimraf": "^3.0.2",
60
+ "typescript": "~5.5.4"
61
+ },
62
+ "publishConfig": {
63
+ "access": "public"
64
+ },
65
+ "jupyterlab": {
66
+ "extension": true,
67
+ "outputDir": "../../notebook/labextension",
68
+ "schemaDir": "schema",
69
+ "_build": {
70
+ "load": "static/remoteEntry.a7f6d6f20e99b7f1c604.js",
71
+ "extension": "./extension",
72
+ "style": "./style"
73
+ }
74
+ },
75
+ "nx": {
76
+ "targets": {
77
+ "build:labextension:dev": {
78
+ "dependsOn": [
79
+ "^build:lib",
80
+ "build:lib"
81
+ ],
82
+ "outputs": [
83
+ "{workspaceRoot}/notebook/labextension",
84
+ "{workspaceRoot}/notebook/labextension/build_log.json"
85
+ ]
86
+ },
87
+ "build:labextension": {
88
+ "dependsOn": [
89
+ "^build:lib",
90
+ "build:lib"
91
+ ],
92
+ "outputs": [
93
+ "{workspaceRoot}/notebook/labextension"
94
+ ]
95
+ },
96
+ "build": {
97
+ "dependsOn": [
98
+ "build:labextension:dev"
99
+ ]
100
+ },
101
+ "build:prod": {
102
+ "dependsOn": [
103
+ "build:labextension"
104
+ ]
105
+ }
106
+ }
107
+ },
108
+ "styleModule": "style/index.js"
109
+ }
emissary-ml/llm-scripts/fine-tuning/llama3/venv/share/jupyter/labextensions/@jupyter-notebook/lab-extension/static/style.js ADDED
@@ -0,0 +1,4 @@
 
 
 
 
 
1
+ /* This is a generated file of CSS imports */
2
+ /* It was generated by @jupyterlab/builder in Build.ensureAssets() */
3
+
4
+ import '@jupyter-notebook/lab-extension/style/index.js';
emissary-ml/llm-scripts/fine-tuning/llama3/venv/share/jupyter/labextensions/jupyterlab_pygments/package.json ADDED
@@ -0,0 +1,205 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "name": "jupyterlab_pygments",
3
+ "version": "0.3.0",
4
+ "description": "Pygments theme using JupyterLab CSS variables",
5
+ "keywords": [
6
+ "jupyter",
7
+ "jupyterlab",
8
+ "jupyterlab-extension"
9
+ ],
10
+ "homepage": "https://github.com/jupyterlab/jupyterlab_pygments",
11
+ "bugs": {
12
+ "url": "https://github.com/jupyterlab/jupyterlab_pygments/issues"
13
+ },
14
+ "license": "BSD-3-Clause",
15
+ "author": {
16
+ "name": "Jupyter Development Team",
17
+ "email": "jupyter@googlegroups.com"
18
+ },
19
+ "files": [
20
+ "lib/**/*.{d.ts,eot,gif,html,jpg,js,js.map,json,png,svg,woff2,ttf}",
21
+ "style/**/*.{css,js,eot,gif,html,jpg,json,png,svg,woff2,ttf}",
22
+ "style/index.js"
23
+ ],
24
+ "main": "lib/index.js",
25
+ "types": "lib/index.d.ts",
26
+ "style": "style/index.css",
27
+ "repository": {
28
+ "type": "git",
29
+ "url": "https://github.com/jupyterlab/jupyterlab_pygments.git"
30
+ },
31
+ "scripts": {
32
+ "build": "jlpm build:css && jlpm build:lib && jlpm build:labextension:dev",
33
+ "build:css": "python generate_css.py",
34
+ "build:labextension": "jupyter labextension build .",
35
+ "build:labextension:dev": "jupyter labextension build --development True .",
36
+ "build:lib": "tsc",
37
+ "build:prod": "jlpm clean && jlpm build:css && jlpm build:lib && jlpm build:labextension",
38
+ "clean": "jlpm clean:lib",
39
+ "clean:all": "jlpm clean:lib && jlpm clean:labextension && jlpm clean:lintcache",
40
+ "clean:labextension": "rimraf jupyterlab_pygments/labextension",
41
+ "clean:lib": "rimraf lib tsconfig.tsbuildinfo style/base.css",
42
+ "clean:lintcache": "rimraf .eslintcache .stylelintcache",
43
+ "eslint": "jlpm eslint:check --fix",
44
+ "eslint:check": "eslint . --cache --ext .ts,.tsx",
45
+ "install:extension": "jlpm build",
46
+ "lint": "jlpm stylelint && jlpm prettier && jlpm eslint",
47
+ "lint:check": "jlpm stylelint:check && jlpm prettier:check && jlpm eslint:check",
48
+ "prettier": "jlpm prettier:base --write --list-different",
49
+ "prettier:base": "prettier \"**/*{.ts,.tsx,.js,.jsx,.css,.json,.md}\"",
50
+ "prettier:check": "jlpm prettier:base --check",
51
+ "stylelint": "jlpm stylelint:check --fix",
52
+ "stylelint:check": "stylelint --cache \"style/**/*.css\"",
53
+ "watch": "run-p watch:src watch:labextension",
54
+ "watch:labextension": "jupyter labextension watch .",
55
+ "watch:src": "tsc -w"
56
+ },
57
+ "dependencies": {
58
+ "@jupyterlab/application": "^4.0.8",
59
+ "@types/node": "^20.9.0"
60
+ },
61
+ "devDependencies": {
62
+ "@jupyterlab/builder": "^4.0.0",
63
+ "@types/json-schema": "^7.0.11",
64
+ "@types/react": "^18.0.26",
65
+ "@types/react-addons-linked-state-mixin": "^0.14.22",
66
+ "@typescript-eslint/eslint-plugin": "^6.1.0",
67
+ "@typescript-eslint/parser": "^6.1.0",
68
+ "css-loader": "^6.7.1",
69
+ "eslint": "^8.36.0",
70
+ "eslint-config-prettier": "^8.8.0",
71
+ "eslint-plugin-prettier": "^5.0.0",
72
+ "npm-run-all": "^4.1.5",
73
+ "prettier": "3.0.3",
74
+ "rimraf": "^5.0.5",
75
+ "source-map-loader": "^1.0.2",
76
+ "style-loader": "^3.3.1",
77
+ "stylelint": "^15.10.1",
78
+ "stylelint-config-prettier": "^9.0.3",
79
+ "stylelint-config-recommended": "^13.0.0",
80
+ "stylelint-config-standard": "^34.0.0",
81
+ "stylelint-csstree-validator": "^3.0.0",
82
+ "stylelint-prettier": "^4.0.0",
83
+ "typescript": "~5.0.2",
84
+ "yjs": "^13.5.40"
85
+ },
86
+ "sideEffects": [
87
+ "style/*.css",
88
+ "style/index.js"
89
+ ],
90
+ "styleModule": "style/index.js",
91
+ "publishConfig": {
92
+ "access": "public"
93
+ },
94
+ "jupyterlab": {
95
+ "extension": true,
96
+ "outputDir": "jupyterlab_pygments/labextension",
97
+ "_build": {
98
+ "load": "static/remoteEntry.5cbb9d2323598fbda535.js",
99
+ "extension": "./extension",
100
+ "style": "./style"
101
+ }
102
+ },
103
+ "jupyter-releaser": {
104
+ "hooks": {
105
+ "before-build-npm": [
106
+ "python -m pip install jupyterlab~=3.1",
107
+ "jlpm"
108
+ ],
109
+ "before-build-python": [
110
+ "jlpm clean:all"
111
+ ]
112
+ }
113
+ },
114
+ "eslintConfig": {
115
+ "extends": [
116
+ "eslint:recommended",
117
+ "plugin:@typescript-eslint/eslint-recommended",
118
+ "plugin:@typescript-eslint/recommended",
119
+ "plugin:prettier/recommended"
120
+ ],
121
+ "parser": "@typescript-eslint/parser",
122
+ "parserOptions": {
123
+ "project": "tsconfig.json",
124
+ "sourceType": "module"
125
+ },
126
+ "plugins": [
127
+ "@typescript-eslint"
128
+ ],
129
+ "rules": {
130
+ "@typescript-eslint/naming-convention": [
131
+ "error",
132
+ {
133
+ "selector": "interface",
134
+ "format": [
135
+ "PascalCase"
136
+ ],
137
+ "custom": {
138
+ "regex": "^I[A-Z]",
139
+ "match": true
140
+ }
141
+ }
142
+ ],
143
+ "@typescript-eslint/no-unused-vars": [
144
+ "warn",
145
+ {
146
+ "args": "none"
147
+ }
148
+ ],
149
+ "@typescript-eslint/no-explicit-any": "off",
150
+ "@typescript-eslint/no-namespace": "off",
151
+ "@typescript-eslint/no-use-before-define": "off",
152
+ "@typescript-eslint/quotes": [
153
+ "error",
154
+ "single",
155
+ {
156
+ "avoidEscape": true,
157
+ "allowTemplateLiterals": false
158
+ }
159
+ ],
160
+ "curly": [
161
+ "error",
162
+ "all"
163
+ ],
164
+ "eqeqeq": "error",
165
+ "prefer-arrow-callback": "error"
166
+ }
167
+ },
168
+ "eslintIgnore": [
169
+ "node_modules",
170
+ "dist",
171
+ "coverage",
172
+ "**/*.d.ts"
173
+ ],
174
+ "prettier": {
175
+ "singleQuote": true,
176
+ "trailingComma": "none",
177
+ "arrowParens": "avoid",
178
+ "endOfLine": "auto",
179
+ "overrides": [
180
+ {
181
+ "files": "package.json",
182
+ "options": {
183
+ "tabWidth": 4
184
+ }
185
+ }
186
+ ]
187
+ },
188
+ "stylelint": {
189
+ "extends": [
190
+ "stylelint-config-recommended",
191
+ "stylelint-config-standard",
192
+ "stylelint-prettier/recommended"
193
+ ],
194
+ "plugins": [
195
+ "stylelint-csstree-validator"
196
+ ],
197
+ "rules": {
198
+ "csstree/validator": true,
199
+ "property-no-vendor-prefix": null,
200
+ "selector-class-pattern": "^([a-z][A-z\\d]*)(-[A-z\\d]+)*$",
201
+ "selector-no-vendor-prefix": null,
202
+ "value-no-vendor-prefix": null
203
+ }
204
+ }
205
+ }
emissary-ml/llm-scripts/fine-tuning/llama3/venv/share/jupyter/nbconvert/templates/base/cell_id_anchor.j2 ADDED
@@ -0,0 +1,5 @@
 
 
 
 
 
 
1
+ {%- macro cell_id_anchor(cell) -%}
2
+ {% if cell.id | length > 0 -%}
3
+ id="{{ ('cell-id=' ~ cell.id) | escape_html -}}"
4
+ {%- endif %}
5
+ {%- endmacro %}
emissary-ml/llm-scripts/fine-tuning/llama3/venv/share/jupyter/nbconvert/templates/base/display_priority.j2 ADDED
@@ -0,0 +1,49 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {%- extends 'base/null.j2' -%}
2
+
3
+ {#display data priority#}
4
+
5
+
6
+ {%- block data_priority scoped -%}
7
+ {%- for type in output.data | filter_data_type -%}
8
+ {%- if type == 'application/pdf' -%}
9
+ {%- block data_pdf -%}
10
+ {%- endblock -%}
11
+ {%- elif type == 'image/svg+xml' -%}
12
+ {%- block data_svg -%}
13
+ {%- endblock -%}
14
+ {%- elif type == 'image/png' -%}
15
+ {%- block data_png -%}
16
+ {%- endblock -%}
17
+ {%- elif type == 'text/html' -%}
18
+ {%- block data_html -%}
19
+ {%- endblock -%}
20
+ {%- elif type == 'text/markdown' -%}
21
+ {%- block data_markdown -%}
22
+ {%- endblock -%}
23
+ {%- elif type == 'image/jpeg' -%}
24
+ {%- block data_jpg -%}
25
+ {%- endblock -%}
26
+ {%- elif type == 'text/plain' -%}
27
+ {%- block data_text -%}
28
+ {%- endblock -%}
29
+ {%- elif type == 'text/latex' -%}
30
+ {%- block data_latex -%}
31
+ {%- endblock -%}
32
+ {%- elif type == 'text/vnd.mermaid' -%}
33
+ {%- block data_mermaid -%}
34
+ {%- endblock -%}
35
+ {%- elif type == 'application/javascript' -%}
36
+ {%- block data_javascript -%}
37
+ {%- endblock -%}
38
+ {%- elif type == 'application/vnd.jupyter.widget-view+json' -%}
39
+ {%- block data_widget_view -%}
40
+ {%- endblock -%}
41
+ {%- elif type == resources.output_mimetype -%}
42
+ {%- block data_native -%}
43
+ {%- endblock -%}
44
+ {%- else -%}
45
+ {%- block data_other -%}
46
+ {%- endblock -%}
47
+ {%- endif -%}
48
+ {%- endfor -%}
49
+ {%- endblock data_priority -%}
emissary-ml/llm-scripts/fine-tuning/llama3/venv/share/jupyter/nbconvert/templates/base/null.j2 ADDED
@@ -0,0 +1,111 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {#
2
+
3
+ DO NOT USE THIS AS A BASE,
4
+ IF YOU ARE COPY AND PASTING THIS FILE
5
+ YOU ARE PROBABLY DOING THINGS INCORRECTLY.
6
+
7
+ Null template, does nothing except defining a basic structure
8
+ To layout the different blocks of a notebook.
9
+
10
+ Subtemplates can override blocks to define their custom representation.
11
+
12
+ If one of the block you do overwrite is not a leaf block, consider
13
+ calling super.
14
+
15
+ {%- block nonLeafBlock -%}
16
+ #add stuff at beginning
17
+ {{ super() }}
18
+ #add stuff at end
19
+ {%- endblock nonLeafBlock -%}
20
+
21
+ consider calling super even if it is a leaf block, we might insert more blocks later.
22
+
23
+ #}
24
+ {%- block header -%}
25
+ {%- endblock header -%}
26
+ {%- block body -%}
27
+ {%- block body_header -%}
28
+ {%- endblock body_header -%}
29
+ {%- block body_loop -%}
30
+ {%- for cell in nb.cells -%}
31
+ {%- block any_cell scoped -%}
32
+ {%- if cell.cell_type == 'code'-%}
33
+ {%- if resources.global_content_filter.include_code -%}
34
+ {%- block codecell scoped -%}
35
+ {%- if resources.global_content_filter.include_input and not cell.metadata.get("transient",{}).get("remove_source", false) -%}
36
+ {%- block input_group -%}
37
+ {%- if resources.global_content_filter.include_input_prompt -%}
38
+ {%- block in_prompt -%}{%- endblock in_prompt -%}
39
+ {%- endif -%}
40
+ {%- block input -%}{%- endblock input -%}
41
+ {%- endblock input_group -%}
42
+ {%- endif -%}
43
+ {%- if cell.outputs and resources.global_content_filter.include_output -%}
44
+ {%- block output_group -%}
45
+ {%- if resources.global_content_filter.include_output_prompt -%}
46
+ {%- block output_prompt -%}{%- endblock output_prompt -%}
47
+ {%- endif -%}
48
+ {%- block outputs scoped -%}
49
+ {%- for output in cell.outputs -%}
50
+ {%- block output scoped -%}
51
+ {%- if output.output_type == 'execute_result' -%}
52
+ {%- block execute_result scoped -%}{%- endblock execute_result -%}
53
+ {%- elif output.output_type == 'stream' -%}
54
+ {%- block stream scoped -%}
55
+ {%- if output.name == 'stdout' -%}
56
+ {%- block stream_stdout scoped -%}
57
+ {%- endblock stream_stdout -%}
58
+ {%- elif output.name == 'stderr' -%}
59
+ {%- block stream_stderr scoped -%}
60
+ {%- endblock stream_stderr -%}
61
+ {%- elif output.name == 'stdin' -%}
62
+ {%- block stream_stdin scoped -%}
63
+ {%- endblock stream_stdin -%}
64
+ {%- endif -%}
65
+ {%- endblock stream -%}
66
+ {%- elif output.output_type == 'display_data' -%}
67
+ {%- block display_data scoped -%}
68
+ {%- block data_priority scoped -%}
69
+ {%- endblock data_priority -%}
70
+ {%- endblock display_data -%}
71
+ {%- elif output.output_type == 'error' -%}
72
+ {%- block error scoped -%}
73
+ {%- for line in output.traceback -%}
74
+ {%- block traceback_line scoped -%}{%- endblock traceback_line -%}
75
+ {%- endfor -%}
76
+ {%- endblock error -%}
77
+ {%- endif -%}
78
+ {%- endblock output -%}
79
+ {%- endfor -%}
80
+ {%- endblock outputs -%}
81
+ {%- endblock output_group -%}
82
+ {%- endif -%}
83
+ {%- endblock codecell -%}
84
+ {%- endif -%}
85
+ {%- elif cell.cell_type in ['markdown'] -%}
86
+ {%- if resources.global_content_filter.include_markdown and not cell.metadata.get("transient",{}).get("remove_source", false) -%}
87
+ {%- block markdowncell scoped-%} {%- endblock markdowncell -%}
88
+ {%- endif -%}
89
+ {%- elif cell.cell_type in ['raw'] -%}
90
+ {%- if resources.global_content_filter.include_raw and not cell.metadata.get("transient",{}).get("remove_source", false) -%}
91
+ {%- block rawcell scoped -%}
92
+ {%- if cell.metadata.get('raw_mimetype', '').lower() in resources.get('raw_mimetypes', ['']) -%}
93
+ {{ cell.source }}
94
+ {%- endif -%}
95
+ {%- endblock rawcell -%}
96
+ {%- endif -%}
97
+ {%- else -%}
98
+ {%- if resources.global_content_filter.include_unknown and not cell.metadata.get("transient",{}).get("remove_source", false) -%}
99
+ {%- block unknowncell scoped-%}
100
+ {%- endblock unknowncell -%}
101
+ {%- endif -%}
102
+ {%- endif -%}
103
+ {%- endblock any_cell -%}
104
+ {%- endfor -%}
105
+ {%- endblock body_loop -%}
106
+ {%- block body_footer -%}
107
+ {%- endblock body_footer -%}
108
+ {%- endblock body -%}
109
+
110
+ {%- block footer -%}
111
+ {%- endblock footer -%}
emissary-ml/llm-scripts/fine-tuning/llama3/venv/share/jupyter/nbconvert/templates/reveal/index.html.j2 ADDED
@@ -0,0 +1,194 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {%- extends 'base.html.j2' -%}
2
+ {% from 'mathjax.html.j2' import mathjax %}
3
+ {% from 'jupyter_widgets.html.j2' import jupyter_widgets %}
4
+
5
+ {% set reveal_url_prefix = resources.reveal.url_prefix | default('https://unpkg.com/reveal.js@4.0.2', true) %}
6
+ {% set reveal_theme = resources.reveal.theme | default('white', true) %}
7
+ {% set reveal_transition = resources.reveal.transition | default('slide', true) %}
8
+ {% set reveal_number = resources.reveal.number | default('', true) %}
9
+ {% set reveal_width = resources.reveal.width | default('960', true) %}
10
+ {% set reveal_height = resources.reveal.height | default('700', true) %}
11
+ {% set reveal_scroll = resources.reveal.scroll | default(false, true) | json_dumps %}
12
+
13
+ {%- block header -%}
14
+ <!DOCTYPE html>
15
+ <html lang="{{ resources.language_code }}">
16
+ <head>
17
+
18
+ {%- block html_head -%}
19
+ <meta charset="utf-8" />
20
+ <meta http-equiv="X-UA-Compatible" content="chrome=1" />
21
+
22
+ <meta name="apple-mobile-web-app-capable" content="yes" />
23
+ <meta name="apple-mobile-web-app-status-bar-style" content="black-translucent" />
24
+
25
+ {% set nb_title = nb.metadata.get('title', resources['metadata']['name']) | escape_html_keep_quotes %}
26
+ <title>{{nb_title}} slides</title>
27
+
28
+ {%- block html_head_js -%}
29
+ {%- block html_head_js_jquery -%}
30
+ <script src="{{ resources.jquery_url }}"></script>
31
+ {%- endblock html_head_js_jquery -%}
32
+ {%- block html_head_js_requirejs -%}
33
+ <script src="{{ resources.require_js_url }}"></script>
34
+ {%- endblock html_head_js_requirejs -%}
35
+ {%- block html_head_js_mermaidjs -%}
36
+ <script type="module">
37
+ import mermaid from '{{ resources.mermaid_js_url }}';
38
+ mermaid.initialize({ startOnLoad: true });
39
+ </script>
40
+ {%- endblock html_head_js_mermaidjs -%}
41
+ {%- endblock html_head_js -%}
42
+
43
+ {% block jupyter_widgets %}
44
+ {%- if "widgets" in nb.metadata -%}
45
+ {{ jupyter_widgets(resources.jupyter_widgets_base_url, resources.html_manager_semver_range, resources.widget_renderer_url) }}
46
+ {%- endif -%}
47
+ {% endblock jupyter_widgets %}
48
+
49
+ <!-- General and theme style sheets -->
50
+ <link rel="stylesheet" href="{{ reveal_url_prefix }}/dist/reveal.css">
51
+
52
+ <!-- If the query includes 'print-pdf', include the PDF print sheet -->
53
+ <script>
54
+ if( window.location.search.match( /print-pdf/gi ) ) {
55
+ var link = document.createElement( 'link' );
56
+ link.rel = 'stylesheet';
57
+ link.type = 'text/css';
58
+ document.getElementsByTagName( 'head' )[0].appendChild( link );
59
+ }
60
+ </script>
61
+
62
+ {% for css in resources.inlining.css -%}
63
+ <style type="text/css">
64
+ {{ css }}
65
+ </style>
66
+ {% endfor %}
67
+
68
+ {% block notebook_css %}
69
+ {{ resources.include_css("static/index.css") }}
70
+ {% if resources.theme == 'dark' %}
71
+ {{ resources.include_css("static/theme-dark.css") }}
72
+ {% else %}
73
+ {{ resources.include_css("static/theme-light.css") }}
74
+ {% endif %}
75
+ <style type="text/css">
76
+ a.anchor-link {
77
+ display: none;
78
+ }
79
+ .highlight {
80
+ margin: 0.4em;
81
+ }
82
+ .jp-Notebook {
83
+ padding: 0;
84
+ }
85
+ :root {
86
+ --jp-ui-font-size1: 20px; /* instead of 14px */
87
+ --jp-content-font-size1: 20px; /* instead of 14px */
88
+ --jp-code-font-size: 19px; /* instead of 13px */
89
+ --jp-cell-prompt-width: 110px; /* instead of 64px */
90
+ }
91
+ @media print {
92
+ body {
93
+ margin: 0;
94
+ }
95
+ }
96
+ </style>
97
+
98
+ {{ resources.include_css("static/custom_reveal.css") }}
99
+
100
+ {% endblock notebook_css %}
101
+
102
+ {%- block html_head_js_mathjax -%}
103
+ {{ mathjax(resources.mathjax_url) }}
104
+ {%- endblock html_head_js_mathjax -%}
105
+
106
+ {%- block html_head_css -%}
107
+ {%- endblock html_head_css -%}
108
+
109
+ {%- endblock html_head -%}
110
+
111
+ <!-- Reveal Theme -->
112
+ <link rel="stylesheet" href="{{ reveal_url_prefix }}/dist/theme/{{reveal_theme}}.css" id="theme">
113
+
114
+ </head>
115
+ {% endblock header%}
116
+
117
+ {%- block body_header -%}
118
+ {% if resources.theme == 'dark' %}
119
+ <body class="jp-Notebook" data-jp-theme-light="false" data-jp-theme-name="JupyterLab Dark">
120
+ {% else %}
121
+ <body class="jp-Notebook" data-jp-theme-light="true" data-jp-theme-name="JupyterLab Light">
122
+ {% endif %}
123
+ <main>
124
+ <div class="reveal">
125
+ <div class="slides">
126
+ {%- endblock body_header -%}
127
+
128
+ {% block body_footer %}
129
+ </div>
130
+ </div>
131
+ </main>
132
+ </body>
133
+ {% endblock body_footer %}
134
+
135
+ {% block footer %}
136
+ {{ super() }}
137
+
138
+ {% block footer_js %}
139
+ <script>
140
+ require(
141
+ {
142
+ // it makes sense to wait a little bit when you are loading
143
+ // reveal from a cdn in a slow connection environment
144
+ waitSeconds: 15
145
+ },
146
+ [
147
+ "{{ reveal_url_prefix }}/dist/reveal.js",
148
+ "{{ reveal_url_prefix }}/plugin/notes/notes.js"
149
+ ],
150
+
151
+ function(Reveal, RevealNotes){
152
+ // Full list of configuration options available here: https://github.com/hakimel/reveal.js#configuration
153
+ Reveal.initialize({
154
+ controls: true,
155
+ progress: true,
156
+ history: true,
157
+ transition: "{{reveal_transition}}",
158
+ slideNumber: "{{reveal_number}}",
159
+ plugins: [RevealNotes],
160
+ width: {{reveal_width}},
161
+ height: {{reveal_height}},
162
+
163
+ });
164
+
165
+ var update = function(event){
166
+ if(MathJax.Hub.getAllJax(Reveal.getCurrentSlide())){
167
+ MathJax.Hub.Rerender(Reveal.getCurrentSlide());
168
+ }
169
+ };
170
+
171
+ Reveal.addEventListener('slidechanged', update);
172
+
173
+ function setScrollingSlide() {
174
+ var scroll = {{ reveal_scroll }}
175
+ if (scroll === true) {
176
+ var h = $('.reveal').height() * 0.95;
177
+ $('section.present').find('section')
178
+ .filter(function() {
179
+ return $(this).height() > h;
180
+ })
181
+ .css('height', 'calc(95vh)')
182
+ .css('overflow-y', 'scroll')
183
+ .css('margin-top', '20px');
184
+ }
185
+ }
186
+
187
+ // check and set the scrolling slide every time the slide change
188
+ Reveal.addEventListener('slidechanged', setScrollingSlide);
189
+ }
190
+ );
191
+ </script>
192
+ {% endblock footer_js %}
193
+ </html>
194
+ {% endblock footer %}
emissary-ml/llm-scripts/fine-tuning/llama3/venv/share/jupyter/nbconvert/templates/reveal/static/custom_reveal.css ADDED
@@ -0,0 +1,121 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ /* Overrides of notebook CSS for static HTML export */
2
+ .reveal {
3
+ font-size: 160%;
4
+ }
5
+ .reveal table {
6
+ font-size: var(--jp-ui-font-size1);
7
+ }
8
+ .reveal pre {
9
+ width: inherit;
10
+ padding: 0.4em;
11
+ margin: 0px;
12
+ font-family: monospace, sans-serif;
13
+ font-size: 80%;
14
+ box-shadow: 0px 0px 0px rgba(0, 0, 0, 0);
15
+ }
16
+ .reveal pre code {
17
+ padding: 0px;
18
+ }
19
+ .reveal section img {
20
+ border: 0px solid black;
21
+ box-shadow: 0 0 10px rgba(0, 0, 0, 0);
22
+ }
23
+ .reveal .slides {
24
+ text-align: left;
25
+ }
26
+ .reveal.fade {
27
+ opacity: 1;
28
+ }
29
+ .reveal .progress {
30
+ position: static;
31
+ }
32
+
33
+ div.jp-InputArea-editor {
34
+ padding: 0.06em;
35
+ }
36
+
37
+ div.code_cell {
38
+ background-color: transparent;
39
+ }
40
+
41
+ div.output_area pre {
42
+ font-family: monospace, sans-serif;
43
+ font-size: 80%;
44
+ }
45
+
46
+ div.jp-OutputPrompt {
47
+ /* 5px right shift to account for margin in parent container */
48
+ margin: 5px 5px 0 0;
49
+ }
50
+
51
+ .reveal div.highlight {
52
+ margin: 0;
53
+ }
54
+
55
+ .reveal div.highlight > pre {
56
+ margin: 0;
57
+ width: 100%;
58
+ font-size: var(--jp-code-font-size);
59
+ }
60
+
61
+ .reveal div.jp-OutputArea-output > pre {
62
+ margin: 0;
63
+ width: 90%;
64
+ font-size: var(--jp-code-font-size);
65
+ box-shadow: none;
66
+ }
67
+
68
+ main {
69
+ height: 100%;
70
+ }
71
+
72
+ /* Reveal navigation controls */
73
+
74
+ .reveal .controls .navigate-left,
75
+ .reveal .controls .navigate-left.enabled {
76
+ border-right-color: #727272;
77
+ }
78
+ .reveal .controls .navigate-left.enabled:hover,
79
+ .reveal .controls .navigate-left.enabled.enabled:hover {
80
+ border-right-color: #dfdfdf;
81
+ }
82
+ .reveal .controls .navigate-right,
83
+ .reveal .controls .navigate-right.enabled {
84
+ border-left-color: #727272;
85
+ }
86
+ .reveal .controls .navigate-right.enabled:hover,
87
+ .reveal .controls .navigate-right.enabled.enabled:hover {
88
+ border-left-color: #dfdfdf;
89
+ }
90
+ .reveal .controls .navigate-up,
91
+ .reveal .controls .navigate-up.enabled {
92
+ border-bottom-color: #727272;
93
+ }
94
+ .reveal .controls .navigate-up.enabled:hover,
95
+ .reveal .controls .navigate-up.enabled.enabled:hover {
96
+ border-bottom-color: #dfdfdf;
97
+ }
98
+ .reveal .controls .navigate-down,
99
+ .reveal .controls .navigate-down.enabled {
100
+ border-top-color: #727272;
101
+ }
102
+ .reveal .controls .navigate-down.enabled:hover,
103
+ .reveal .controls .navigate-down.enabled.enabled:hover {
104
+ border-top-color: #dfdfdf;
105
+ }
106
+ .reveal .progress span {
107
+ background: #727272;
108
+ }
109
+
110
+ /* Scrollbars */
111
+
112
+ ::-webkit-scrollbar {
113
+ width: 6px;
114
+ height: 6px;
115
+ }
116
+ ::-webkit-scrollbar * {
117
+ background: transparent;
118
+ }
119
+ ::-webkit-scrollbar-thumb {
120
+ background: #727272 !important;
121
+ }
emissary-ml/llm-scripts/fine-tuning/llama3/venv/share/jupyter/nbconvert/templates/rst/conf.json ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ {
2
+ "base_template": "base",
3
+ "mimetypes": {
4
+ "text/x-rst": true
5
+ }
6
+ }
emissary-ml/llm-scripts/fine-tuning/llama3/venv/share/jupyter/nbconvert/templates/rst/index.rst.j2 ADDED
@@ -0,0 +1,117 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {%- extends 'display_priority.j2' -%}
2
+
3
+
4
+ {% block in_prompt %}
5
+ {% endblock in_prompt %}
6
+
7
+ {% block output_prompt %}
8
+ {% endblock output_prompt %}
9
+
10
+ {% block input scoped%}
11
+ {%- if cell.source.strip() -%}
12
+ {{".. code:: "-}}
13
+ {%- if 'magics_language' in cell.metadata -%}
14
+ {{ cell.metadata.magics_language}}
15
+ {%- elif 'pygments_lexer' in nb.metadata.get('language_info', {}) -%}
16
+ {{ nb.metadata.language_info.pygments_lexer }}
17
+ {%- elif 'name' in nb.metadata.get('language_info', {}) -%}
18
+ {{ nb.metadata.language_info.name }}
19
+ {%- endif %}
20
+
21
+ {{ cell.source | indent}}
22
+ {% endif -%}
23
+ {% endblock input %}
24
+
25
+ {% block error %}
26
+ ::
27
+
28
+ {{ super() }}
29
+ {% endblock error %}
30
+
31
+ {% block traceback_line %}
32
+ {{ line | indent | strip_ansi }}
33
+ {% endblock traceback_line %}
34
+
35
+ {% block execute_result %}
36
+ {% block data_priority scoped %}
37
+ {{ super() }}
38
+ {% endblock %}
39
+ {% endblock execute_result %}
40
+
41
+ {% block stream %}
42
+ .. parsed-literal::
43
+
44
+ {{ output.text | indent }}
45
+ {% endblock stream %}
46
+
47
+ {% block data_native %}
48
+ {{ output.data['text/x-rst'] }}
49
+ {% endblock data_native %}
50
+
51
+ {% block data_svg %}
52
+ .. image:: {{ output.metadata.filenames['image/svg+xml'] | urlencode }}
53
+ {% endblock data_svg %}
54
+
55
+ {% block data_png %}
56
+ .. image:: {{ output.metadata.filenames['image/png'] | urlencode }}
57
+ {%- set width=output | get_metadata('width', 'image/png') -%}
58
+ {%- if width is not none %}
59
+ :width: {{ width }}px
60
+ {%- endif %}
61
+ {%- set height=output | get_metadata('height', 'image/png') -%}
62
+ {%- if height is not none %}
63
+ :height: {{ height }}px
64
+ {%- endif %}
65
+ {% endblock data_png %}
66
+
67
+ {% block data_jpg %}
68
+ .. image:: {{ output.metadata.filenames['image/jpeg'] | urlencode }}
69
+ {%- set width=output | get_metadata('width', 'image/jpeg') -%}
70
+ {%- if width is not none %}
71
+ :width: {{ width }}px
72
+ {%- endif %}
73
+ {%- set height=output | get_metadata('height', 'image/jpeg') -%}
74
+ {%- if height is not none %}
75
+ :height: {{ height }}px
76
+ {%- endif %}
77
+ {% endblock data_jpg %}
78
+
79
+ {% block data_markdown %}
80
+ {{ output.data['text/markdown'] | convert_pandoc("markdown", "rst") }}
81
+ {% endblock data_markdown %}
82
+
83
+ {% block data_latex %}
84
+ .. math::
85
+
86
+ {{ output.data['text/latex'] | strip_dollars | indent }}
87
+ {% endblock data_latex %}
88
+
89
+ {% block data_text scoped %}
90
+ .. parsed-literal::
91
+
92
+ {{ output.data['text/plain'] | indent }}
93
+ {% endblock data_text %}
94
+
95
+ {% block data_html scoped %}
96
+ .. raw:: html
97
+
98
+ {{ output.data['text/html'] | indent }}
99
+ {% endblock data_html %}
100
+
101
+ {% block markdowncell scoped %}
102
+ {{ cell.source | convert_pandoc("markdown", "rst") }}
103
+ {% endblock markdowncell %}
104
+
105
+ {%- block rawcell scoped -%}
106
+ {%- if cell.metadata.get('raw_mimetype', '').lower() in resources.get('raw_mimetypes', ['']) %}
107
+ {{cell.source}}
108
+ {% endif -%}
109
+ {%- endblock rawcell -%}
110
+
111
+ {% block headingcell scoped %}
112
+ {{ ("#" * cell.level + cell.source) | replace('\n', ' ') | convert_pandoc("markdown", "rst") }}
113
+ {% endblock headingcell %}
114
+
115
+ {% block unknowncell scoped %}
116
+ unknown type {{cell.type}}
117
+ {% endblock unknowncell %}
emissary-ml/llm-scripts/fine-tuning/llama3/wandb/debug.log ADDED
@@ -0,0 +1,34 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ 2025-08-11 23:43:33,509 INFO MainThread:96305 [wandb_setup.py:_flush():76] Current SDK version is 0.16.5
2
+ 2025-08-11 23:43:33,509 INFO MainThread:96305 [wandb_setup.py:_flush():76] Configure stats pid to 96305
3
+ 2025-08-11 23:43:33,509 INFO MainThread:96305 [wandb_setup.py:_flush():76] Loading settings from /root/.config/wandb/settings
4
+ 2025-08-11 23:43:33,509 INFO MainThread:96305 [wandb_setup.py:_flush():76] Loading settings from /home/shadeform/emissary-ml/llm-scripts/fine-tuning/llama3/wandb/settings
5
+ 2025-08-11 23:43:33,509 WARNING MainThread:96305 [wandb_setup.py:_flush():76] Unknown environment variable: WANDB_KEY
6
+ 2025-08-11 23:43:33,509 INFO MainThread:96305 [wandb_setup.py:_flush():76] Loading settings from environment variables: {}
7
+ 2025-08-11 23:43:33,509 INFO MainThread:96305 [wandb_setup.py:_flush():76] Inferring run settings from compute environment: {'program_relpath': 'llm-scripts/fine-tuning/llama3/train.py', 'program_abspath': '/home/shadeform/emissary-ml/llm-scripts/fine-tuning/llama3/train.py', 'program': '/home/shadeform/emissary-ml/llm-scripts/fine-tuning/llama3/train.py'}
8
+ 2025-08-11 23:43:33,509 INFO MainThread:96305 [wandb_setup.py:_flush():76] Applying login settings: {'api_key': '***REDACTED***'}
9
+ 2025-08-11 23:43:33,509 INFO MainThread:96305 [wandb_setup.py:_flush():76] Applying login settings: {'api_key': '***REDACTED***'}
10
+ 2025-08-11 23:43:33,509 INFO MainThread:96305 [wandb_setup.py:_flush():76] Applying login settings: {}
11
+ 2025-08-11 23:43:33,509 INFO MainThread:96305 [wandb_init.py:_log_setup():527] Logging user logs to /home/shadeform/emissary-ml/llm-scripts/fine-tuning/llama3/wandb/run-20250811_234333-63gx7jwn/logs/debug.log
12
+ 2025-08-11 23:43:33,509 INFO MainThread:96305 [wandb_init.py:_log_setup():528] Logging internal logs to /home/shadeform/emissary-ml/llm-scripts/fine-tuning/llama3/wandb/run-20250811_234333-63gx7jwn/logs/debug-internal.log
13
+ 2025-08-11 23:43:33,509 INFO MainThread:96305 [wandb_init.py:init():567] calling init triggers
14
+ 2025-08-11 23:43:33,509 INFO MainThread:96305 [wandb_init.py:init():574] wandb.init called with sweep_config: {}
15
+ config: {}
16
+ 2025-08-11 23:43:33,509 INFO MainThread:96305 [wandb_init.py:init():617] starting backend
17
+ 2025-08-11 23:43:33,510 INFO MainThread:96305 [wandb_init.py:init():621] setting up manager
18
+ 2025-08-11 23:43:33,512 INFO MainThread:96305 [backend.py:_multiprocessing_setup():105] multiprocessing start_methods=fork,spawn,forkserver, using: spawn
19
+ 2025-08-11 23:43:33,513 INFO MainThread:96305 [wandb_init.py:init():629] backend started and connected
20
+ 2025-08-11 23:43:33,521 INFO MainThread:96305 [wandb_init.py:init():721] updated telemetry
21
+ 2025-08-11 23:43:33,526 INFO MainThread:96305 [wandb_init.py:init():754] communicating run to backend with 90.0 second timeout
22
+ 2025-08-11 23:43:33,828 INFO MainThread:96305 [wandb_run.py:_on_init():2344] communicating current version
23
+ 2025-08-11 23:43:33,868 INFO MainThread:96305 [wandb_run.py:_on_init():2353] got version response upgrade_message: "wandb version 0.21.1 is available! To upgrade, please run:\n $ pip install wandb --upgrade"
24
+
25
+ 2025-08-11 23:43:33,868 INFO MainThread:96305 [wandb_init.py:init():805] starting run threads in backend
26
+ 2025-08-11 23:43:34,670 INFO MainThread:96305 [wandb_run.py:_console_start():2323] atexit reg
27
+ 2025-08-11 23:43:34,670 INFO MainThread:96305 [wandb_run.py:_redirect():2178] redirect: wrap_raw
28
+ 2025-08-11 23:43:34,670 INFO MainThread:96305 [wandb_run.py:_redirect():2243] Wrapping output streams.
29
+ 2025-08-11 23:43:34,671 INFO MainThread:96305 [wandb_run.py:_redirect():2268] Redirects installed.
30
+ 2025-08-11 23:43:34,671 INFO MainThread:96305 [wandb_init.py:init():848] run started, returning control to user process
31
+ 2025-08-11 23:47:14,511 INFO MainThread:96305 [wandb_run.py:_config_callback():1347] config_cb None None {'peft_config': {'default': {'task_type': 'CAUSAL_LM', 'peft_type': <PeftType.LORA: 'LORA'>, 'auto_mapping': None, 'base_model_name_or_path': 'emissary-ai/Python-Tab-Completion-CodeLlama-70b', 'revision': None, 'inference_mode': False, 'r': 16, 'target_modules': {'v_proj', 'up_proj', 'gate_proj', 'q_proj', 'k_proj', 'down_proj', 'o_proj'}, 'exclude_modules': None, 'lora_alpha': 64, 'lora_dropout': 0.05, 'fan_in_fan_out': False, 'bias': 'none', 'use_rslora': False, 'modules_to_save': None, 'init_lora_weights': True, 'layers_to_transform': None, 'layers_pattern': None, 'rank_pattern': {}, 'alpha_pattern': {}, 'megatron_config': None, 'megatron_core': 'megatron.core', 'trainable_token_indices': None, 'loftq_config': {}, 'eva_config': None, 'corda_config': None, 'use_dora': False, 'use_qalora': False, 'qalora_group_size': 16, 'layer_replication': None, 'runtime_config': {'ephemeral_gpu_offload': False}, 'lora_bias': False, 'target_parameters': None}}, 'vocab_size': 32016, 'max_position_embeddings': 131072, 'hidden_size': 8192, 'intermediate_size': 28672, 'num_hidden_layers': 80, 'num_attention_heads': 64, 'num_key_value_heads': 8, 'hidden_act': 'silu', 'initializer_range': 0.02, 'rms_norm_eps': 1e-05, 'pretraining_tp': 1, 'use_cache': True, 'rope_theta': 10000, 'rope_scaling': None, 'attention_bias': False, 'attention_dropout': 0.0, 'mlp_bias': False, 'head_dim': 128, 'return_dict': True, 'output_hidden_states': False, 'torchscript': False, 'torch_dtype': 'float16', 'pruned_heads': {}, 'tie_word_embeddings': False, 'chunk_size_feed_forward': 0, 'is_encoder_decoder': False, 'is_decoder': False, 'cross_attention_hidden_size': None, 'add_cross_attention': False, 'tie_encoder_decoder': False, 'architectures': ['LlamaForCausalLM'], 'finetuning_task': None, 'id2label': {0: 'LABEL_0', 1: 'LABEL_1'}, 'label2id': {'LABEL_0': 0, 'LABEL_1': 1}, 'task_specific_params': None, 
'problem_type': None, 'tokenizer_class': None, 'prefix': None, 'bos_token_id': 1, 'pad_token_id': 2, 'eos_token_id': 2, 'sep_token_id': None, 'decoder_start_token_id': None, 'max_length': 20, 'min_length': 0, 'do_sample': False, 'early_stopping': False, 'num_beams': 1, 'num_beam_groups': 1, 'diversity_penalty': 0.0, 'temperature': 1.0, 'top_k': 50, 'top_p': 1.0, 'typical_p': 1.0, 'repetition_penalty': 1.0, 'length_penalty': 1.0, 'no_repeat_ngram_size': 0, 'encoder_no_repeat_ngram_size': 0, 'bad_words_ids': None, 'num_return_sequences': 1, 'output_scores': False, 'return_dict_in_generate': False, 'forced_bos_token_id': None, 'forced_eos_token_id': None, 'remove_invalid_values': False, 'exponential_decay_length_penalty': None, 'suppress_tokens': None, 'begin_suppress_tokens': None, '_name_or_path': 'emissary-ai/Python-Tab-Completion-CodeLlama-70b', 'transformers_version': '4.55.0', 'model_type': 'llama', 'tf_legacy_loss': False, 'use_bfloat16': False, 'quantization_config': {'quant_method': 'QuantizationMethod.BITS_AND_BYTES', '_load_in_8bit': True, '_load_in_4bit': False, 'llm_int8_threshold': 6.0, 'llm_int8_skip_modules': None, 'llm_int8_enable_fp32_cpu_offload': False, 'llm_int8_has_fp16_weight': False, 'bnb_4bit_quant_type': 'fp4', 'bnb_4bit_use_double_quant': False, 'bnb_4bit_compute_dtype': 'float32', 'bnb_4bit_quant_storage': 'uint8', 'load_in_4bit': False, 'load_in_8bit': True}, 'output_attentions': False, 'output_dir': 'checkpoints', 'overwrite_output_dir': False, 'do_train': False, 'do_eval': False, 'do_predict': False, 'eval_strategy': 'no', 'prediction_loss_only': False, 'per_device_train_batch_size': 4, 'per_device_eval_batch_size': 8, 'per_gpu_train_batch_size': None, 'per_gpu_eval_batch_size': None, 'gradient_accumulation_steps': 16, 'eval_accumulation_steps': None, 'eval_delay': 0, 'torch_empty_cache_steps': None, 'learning_rate': 0.0002, 'weight_decay': 0.01, 'adam_beta1': 0.9, 'adam_beta2': 0.999, 'adam_epsilon': 1e-08, 'max_grad_norm': 0.3, 
'num_train_epochs': 0, 'max_steps': 0, 'lr_scheduler_type': 'linear', 'lr_scheduler_kwargs': {}, 'warmup_ratio': 0.0, 'warmup_steps': 0, 'log_level': 'passive', 'log_level_replica': 'warning', 'log_on_each_node': True, 'logging_dir': 'checkpoints/runs/Aug11_23-47-13_shadecloud', 'logging_strategy': 'steps', 'logging_first_step': False, 'logging_steps': 10, 'logging_nan_inf_filter': True, 'save_strategy': 'epoch', 'save_steps': 99999, 'save_total_limit': None, 'save_safetensors': True, 'save_on_each_node': False, 'save_only_model': False, 'restore_callback_states_from_checkpoint': False, 'no_cuda': False, 'use_cpu': False, 'use_mps_device': False, 'seed': 3407, 'data_seed': None, 'jit_mode_eval': False, 'use_ipex': False, 'bf16': False, 'fp16': False, 'fp16_opt_level': 'O1', 'half_precision_backend': 'auto', 'bf16_full_eval': False, 'fp16_full_eval': False, 'tf32': None, 'local_rank': 0, 'ddp_backend': None, 'tpu_num_cores': None, 'tpu_metrics_debug': False, 'debug': [], 'dataloader_drop_last': False, 'eval_steps': None, 'dataloader_num_workers': 0, 'dataloader_prefetch_factor': None, 'past_index': -1, 'run_name': None, 'disable_tqdm': False, 'remove_unused_columns': True, 'label_names': None, 'load_best_model_at_end': False, 'metric_for_best_model': None, 'greater_is_better': None, 'ignore_data_skip': False, 'fsdp': [], 'fsdp_min_num_params': 0, 'fsdp_config': {'min_num_params': 0, 'xla': False, 'xla_fsdp_v2': False, 'xla_fsdp_grad_ckpt': False}, 'fsdp_transformer_layer_cls_to_wrap': None, 'accelerator_config': {'split_batches': False, 'dispatch_batches': None, 'even_batches': True, 'use_seedable_sampler': True, 'non_blocking': False, 'gradient_accumulation_kwargs': None}, 'deepspeed': None, 'label_smoothing_factor': 0.0, 'optim': 'paged_adamw_8bit', 'optim_args': None, 'adafactor': False, 'group_by_length': False, 'length_column_name': 'length', 'report_to': ['wandb'], 'ddp_find_unused_parameters': False, 'ddp_bucket_cap_mb': None, 'ddp_broadcast_buffers': None, 
'dataloader_pin_memory': True, 'dataloader_persistent_workers': False, 'skip_memory_metrics': True, 'use_legacy_prediction_loop': False, 'push_to_hub': False, 'resume_from_checkpoint': None, 'hub_model_id': None, 'hub_strategy': 'every_save', 'hub_token': '<HUB_TOKEN>', 'hub_private_repo': None, 'hub_always_push': False, 'hub_revision': None, 'gradient_checkpointing': True, 'gradient_checkpointing_kwargs': None, 'include_inputs_for_metrics': False, 'include_for_metrics': [], 'eval_do_concat_batches': True, 'fp16_backend': 'auto', 'push_to_hub_model_id': None, 'push_to_hub_organization': None, 'push_to_hub_token': '<PUSH_TO_HUB_TOKEN>', 'mp_parameters': '', 'auto_find_batch_size': True, 'full_determinism': False, 'torchdynamo': None, 'ray_scope': 'last', 'ddp_timeout': 1800, 'torch_compile': False, 'torch_compile_backend': None, 'torch_compile_mode': None, 'include_tokens_per_second': False, 'include_num_input_tokens_seen': False, 'neftune_noise_alpha': None, 'optim_target_modules': None, 'batch_eval_metrics': False, 'eval_on_start': False, 'use_liger_kernel': False, 'liger_kernel_config': None, 'eval_use_gather_object': False, 'average_tokens_across_devices': False, 'model_init_kwargs': None, 'use_liger': False, 'dataset_text_field': 'text', 'dataset_kwargs': None, 'dataset_num_proc': None, 'max_seq_length': 1024, 'packing': False, 'eval_packing': None, 'dataset_batch_size': None, 'num_of_sequences': None, 'chars_per_token': '<CHARS_PER_TOKEN>'}
32
+ 2025-08-11 23:47:14,520 INFO MainThread:96305 [wandb_config.py:__setitem__():151] config set model/num_parameters = 69184004096 - <bound method Run._config_callback of <wandb.sdk.wandb_run.Run object at 0x7f75842f5780>>
33
+ 2025-08-11 23:47:14,520 INFO MainThread:96305 [wandb_run.py:_config_callback():1347] config_cb model/num_parameters 69184004096 None
34
+ 2025-08-11 23:47:55,627 WARNING MsgRouterThr:96305 [router.py:message_loop():77] message_loop has been closed
emissary-ml/llm-scripts/fine-tuning/llama3/wandb/run-20250811_231120-bt4spvmx/files/wandb-metadata.json ADDED
@@ -0,0 +1,741 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "os": "Linux-5.15.0-151-generic-x86_64-with-glibc2.35",
3
+ "python": "3.10.12",
4
+ "heartbeatAt": "2025-08-11T23:11:21.233602",
5
+ "startedAt": "2025-08-11T23:11:20.295305",
6
+ "docker": null,
7
+ "cuda": null,
8
+ "args": [
9
+ "--dataset_path",
10
+ "/home/shadeform/tr-5ekuRmvnwgDznEKHAQcBL2-train.jsonl",
11
+ "--dataset_id",
12
+ "ds-9eYnuJhismAkC4AqzDXuVo",
13
+ "--test_dataset_path",
14
+ "/home/shadeform/tr-5ekuRmvnwgDznEKHAQcBL2-test.jsonl",
15
+ "--test_data_id",
16
+ "ds-MLF2XiyMxXD4CPsrLwKYAY",
17
+ "--service_id",
18
+ "ms-DbLTHy7dKWzyFzjvLDENkY",
19
+ "--training_id",
20
+ "tr-Mwx5sYhG3PnojUx9dNq3Bn",
21
+ "--user_id",
22
+ "user_2dNEee5lJORqWKAhGHurdhTLvEQ",
23
+ "--task_type",
24
+ "text-generation",
25
+ "--model_name",
26
+ "Llama3.1-8B-Instruct",
27
+ "--base_model_link",
28
+ "emissary-ai/Python-Tab-Completion-CodeLlama-70b",
29
+ "--is_external",
30
+ "false",
31
+ "--training_technique",
32
+ "SFT"
33
+ ],
34
+ "state": "running",
35
+ "program": "/home/shadeform/emissary-ml/llm-scripts/fine-tuning/llama3/train.py",
36
+ "codePathLocal": "train.py",
37
+ "codePath": "llm-scripts/fine-tuning/llama3/train.py",
38
+ "git": {
39
+ "remote": "https://coloryourlife:@github.com/Emissary-Tech/emissary-ml.git",
40
+ "commit": "0143ec41bec5a001ce9b65ac366aa9ddd6cdc966"
41
+ },
42
+ "email": null,
43
+ "root": "/home/shadeform/emissary-ml",
44
+ "host": "shadecloud",
45
+ "username": "root",
46
+ "executable": "/home/shadeform/emissary-ml/llm-scripts/fine-tuning/llama3/venv/bin/python",
47
+ "cpu_count": 64,
48
+ "cpu_count_logical": 128,
49
+ "cpu_freq": {
50
+ "current": 2236.7202578124998,
51
+ "min": 1500.0,
52
+ "max": 3250.0
53
+ },
54
+ "cpu_freq_per_core": [
55
+ {
56
+ "current": 1500.0,
57
+ "min": 1500.0,
58
+ "max": 3250.0
59
+ },
60
+ {
61
+ "current": 1500.0,
62
+ "min": 1500.0,
63
+ "max": 3250.0
64
+ },
65
+ {
66
+ "current": 1500.0,
67
+ "min": 1500.0,
68
+ "max": 3250.0
69
+ },
70
+ {
71
+ "current": 1500.0,
72
+ "min": 1500.0,
73
+ "max": 3250.0
74
+ },
75
+ {
76
+ "current": 1500.0,
77
+ "min": 1500.0,
78
+ "max": 3250.0
79
+ },
80
+ {
81
+ "current": 1500.0,
82
+ "min": 1500.0,
83
+ "max": 3250.0
84
+ },
85
+ {
86
+ "current": 1500.0,
87
+ "min": 1500.0,
88
+ "max": 3250.0
89
+ },
90
+ {
91
+ "current": 1500.0,
92
+ "min": 1500.0,
93
+ "max": 3250.0
94
+ },
95
+ {
96
+ "current": 1500.0,
97
+ "min": 1500.0,
98
+ "max": 3250.0
99
+ },
100
+ {
101
+ "current": 1500.0,
102
+ "min": 1500.0,
103
+ "max": 3250.0
104
+ },
105
+ {
106
+ "current": 3250.0,
107
+ "min": 1500.0,
108
+ "max": 3250.0
109
+ },
110
+ {
111
+ "current": 1500.0,
112
+ "min": 1500.0,
113
+ "max": 3250.0
114
+ },
115
+ {
116
+ "current": 1500.0,
117
+ "min": 1500.0,
118
+ "max": 3250.0
119
+ },
120
+ {
121
+ "current": 1500.0,
122
+ "min": 1500.0,
123
+ "max": 3250.0
124
+ },
125
+ {
126
+ "current": 1500.0,
127
+ "min": 1500.0,
128
+ "max": 3250.0
129
+ },
130
+ {
131
+ "current": 1500.0,
132
+ "min": 1500.0,
133
+ "max": 3250.0
134
+ },
135
+ {
136
+ "current": 1500.0,
137
+ "min": 1500.0,
138
+ "max": 3250.0
139
+ },
140
+ {
141
+ "current": 1500.0,
142
+ "min": 1500.0,
143
+ "max": 3250.0
144
+ },
145
+ {
146
+ "current": 1500.0,
147
+ "min": 1500.0,
148
+ "max": 3250.0
149
+ },
150
+ {
151
+ "current": 1500.0,
152
+ "min": 1500.0,
153
+ "max": 3250.0
154
+ },
155
+ {
156
+ "current": 1500.0,
157
+ "min": 1500.0,
158
+ "max": 3250.0
159
+ },
160
+ {
161
+ "current": 1500.0,
162
+ "min": 1500.0,
163
+ "max": 3250.0
164
+ },
165
+ {
166
+ "current": 1500.0,
167
+ "min": 1500.0,
168
+ "max": 3250.0
169
+ },
170
+ {
171
+ "current": 3250.0,
172
+ "min": 1500.0,
173
+ "max": 3250.0
174
+ },
175
+ {
176
+ "current": 1500.0,
177
+ "min": 1500.0,
178
+ "max": 3250.0
179
+ },
180
+ {
181
+ "current": 1500.0,
182
+ "min": 1500.0,
183
+ "max": 3250.0
184
+ },
185
+ {
186
+ "current": 1500.0,
187
+ "min": 1500.0,
188
+ "max": 3250.0
189
+ },
190
+ {
191
+ "current": 1500.0,
192
+ "min": 1500.0,
193
+ "max": 3250.0
194
+ },
195
+ {
196
+ "current": 1500.0,
197
+ "min": 1500.0,
198
+ "max": 3250.0
199
+ },
200
+ {
201
+ "current": 1500.0,
202
+ "min": 1500.0,
203
+ "max": 3250.0
204
+ },
205
+ {
206
+ "current": 1500.0,
207
+ "min": 1500.0,
208
+ "max": 3250.0
209
+ },
210
+ {
211
+ "current": 1500.0,
212
+ "min": 1500.0,
213
+ "max": 3250.0
214
+ },
215
+ {
216
+ "current": 1500.0,
217
+ "min": 1500.0,
218
+ "max": 3250.0
219
+ },
220
+ {
221
+ "current": 3250.0,
222
+ "min": 1500.0,
223
+ "max": 3250.0
224
+ },
225
+ {
226
+ "current": 1500.0,
227
+ "min": 1500.0,
228
+ "max": 3250.0
229
+ },
230
+ {
231
+ "current": 3250.0,
232
+ "min": 1500.0,
233
+ "max": 3250.0
234
+ },
235
+ {
236
+ "current": 3250.0,
237
+ "min": 1500.0,
238
+ "max": 3250.0
239
+ },
240
+ {
241
+ "current": 3250.0,
242
+ "min": 1500.0,
243
+ "max": 3250.0
244
+ },
245
+ {
246
+ "current": 3250.0,
247
+ "min": 1500.0,
248
+ "max": 3250.0
249
+ },
250
+ {
251
+ "current": 3250.0,
252
+ "min": 1500.0,
253
+ "max": 3250.0
254
+ },
255
+ {
256
+ "current": 3250.0,
257
+ "min": 1500.0,
258
+ "max": 3250.0
259
+ },
260
+ {
261
+ "current": 3250.0,
262
+ "min": 1500.0,
263
+ "max": 3250.0
264
+ },
265
+ {
266
+ "current": 3250.0,
267
+ "min": 1500.0,
268
+ "max": 3250.0
269
+ },
270
+ {
271
+ "current": 3250.0,
272
+ "min": 1500.0,
273
+ "max": 3250.0
274
+ },
275
+ {
276
+ "current": 2300.0,
277
+ "min": 1500.0,
278
+ "max": 3250.0
279
+ },
280
+ {
281
+ "current": 3250.0,
282
+ "min": 1500.0,
283
+ "max": 3250.0
284
+ },
285
+ {
286
+ "current": 3250.0,
287
+ "min": 1500.0,
288
+ "max": 3250.0
289
+ },
290
+ {
291
+ "current": 3250.0,
292
+ "min": 1500.0,
293
+ "max": 3250.0
294
+ },
295
+ {
296
+ "current": 3250.0,
297
+ "min": 1500.0,
298
+ "max": 3250.0
299
+ },
300
+ {
301
+ "current": 3250.0,
302
+ "min": 1500.0,
303
+ "max": 3250.0
304
+ },
305
+ {
306
+ "current": 3250.0,
307
+ "min": 1500.0,
308
+ "max": 3250.0
309
+ },
310
+ {
311
+ "current": 2300.0,
312
+ "min": 1500.0,
313
+ "max": 3250.0
314
+ },
315
+ {
316
+ "current": 3250.0,
317
+ "min": 1500.0,
318
+ "max": 3250.0
319
+ },
320
+ {
321
+ "current": 3250.0,
322
+ "min": 1500.0,
323
+ "max": 3250.0
324
+ },
325
+ {
326
+ "current": 3250.0,
327
+ "min": 1500.0,
328
+ "max": 3250.0
329
+ },
330
+ {
331
+ "current": 2300.0,
332
+ "min": 1500.0,
333
+ "max": 3250.0
334
+ },
335
+ {
336
+ "current": 3250.0,
337
+ "min": 1500.0,
338
+ "max": 3250.0
339
+ },
340
+ {
341
+ "current": 1500.0,
342
+ "min": 1500.0,
343
+ "max": 3250.0
344
+ },
345
+ {
346
+ "current": 3250.0,
347
+ "min": 1500.0,
348
+ "max": 3250.0
349
+ },
350
+ {
351
+ "current": 1500.0,
352
+ "min": 1500.0,
353
+ "max": 3250.0
354
+ },
355
+ {
356
+ "current": 3250.0,
357
+ "min": 1500.0,
358
+ "max": 3250.0
359
+ },
360
+ {
361
+ "current": 3250.0,
362
+ "min": 1500.0,
363
+ "max": 3250.0
364
+ },
365
+ {
366
+ "current": 1500.0,
367
+ "min": 1500.0,
368
+ "max": 3250.0
369
+ },
370
+ {
371
+ "current": 3250.0,
372
+ "min": 1500.0,
373
+ "max": 3250.0
374
+ },
375
+ {
376
+ "current": 1500.0,
377
+ "min": 1500.0,
378
+ "max": 3250.0
379
+ },
380
+ {
381
+ "current": 1500.0,
382
+ "min": 1500.0,
383
+ "max": 3250.0
384
+ },
385
+ {
386
+ "current": 1500.0,
387
+ "min": 1500.0,
388
+ "max": 3250.0
389
+ },
390
+ {
391
+ "current": 1500.0,
392
+ "min": 1500.0,
393
+ "max": 3250.0
394
+ },
395
+ {
396
+ "current": 1500.0,
397
+ "min": 1500.0,
398
+ "max": 3250.0
399
+ },
400
+ {
401
+ "current": 1500.0,
402
+ "min": 1500.0,
403
+ "max": 3250.0
404
+ },
405
+ {
406
+ "current": 1500.0,
407
+ "min": 1500.0,
408
+ "max": 3250.0
409
+ },
410
+ {
411
+ "current": 1500.0,
412
+ "min": 1500.0,
413
+ "max": 3250.0
414
+ },
415
+ {
416
+ "current": 1500.0,
417
+ "min": 1500.0,
418
+ "max": 3250.0
419
+ },
420
+ {
421
+ "current": 1500.0,
422
+ "min": 1500.0,
423
+ "max": 3250.0
424
+ },
425
+ {
426
+ "current": 1500.0,
427
+ "min": 1500.0,
428
+ "max": 3250.0
429
+ },
430
+ {
431
+ "current": 1500.0,
432
+ "min": 1500.0,
433
+ "max": 3250.0
434
+ },
435
+ {
436
+ "current": 1500.0,
437
+ "min": 1500.0,
438
+ "max": 3250.0
439
+ },
440
+ {
441
+ "current": 1500.0,
442
+ "min": 1500.0,
443
+ "max": 3250.0
444
+ },
445
+ {
446
+ "current": 1500.0,
447
+ "min": 1500.0,
448
+ "max": 3250.0
449
+ },
450
+ {
451
+ "current": 1500.0,
452
+ "min": 1500.0,
453
+ "max": 3250.0
454
+ },
455
+ {
456
+ "current": 1500.0,
457
+ "min": 1500.0,
458
+ "max": 3250.0
459
+ },
460
+ {
461
+ "current": 1500.0,
462
+ "min": 1500.0,
463
+ "max": 3250.0
464
+ },
465
+ {
466
+ "current": 1500.0,
467
+ "min": 1500.0,
468
+ "max": 3250.0
469
+ },
470
+ {
471
+ "current": 1500.0,
472
+ "min": 1500.0,
473
+ "max": 3250.0
474
+ },
475
+ {
476
+ "current": 1500.0,
477
+ "min": 1500.0,
478
+ "max": 3250.0
479
+ },
480
+ {
481
+ "current": 1500.0,
482
+ "min": 1500.0,
483
+ "max": 3250.0
484
+ },
485
+ {
486
+ "current": 1500.0,
487
+ "min": 1500.0,
488
+ "max": 3250.0
489
+ },
490
+ {
491
+ "current": 1500.0,
492
+ "min": 1500.0,
493
+ "max": 3250.0
494
+ },
495
+ {
496
+ "current": 1500.0,
497
+ "min": 1500.0,
498
+ "max": 3250.0
499
+ },
500
+ {
501
+ "current": 1500.0,
502
+ "min": 1500.0,
503
+ "max": 3250.0
504
+ },
505
+ {
506
+ "current": 1500.0,
507
+ "min": 1500.0,
508
+ "max": 3250.0
509
+ },
510
+ {
511
+ "current": 3250.0,
512
+ "min": 1500.0,
513
+ "max": 3250.0
514
+ },
515
+ {
516
+ "current": 3250.0,
517
+ "min": 1500.0,
518
+ "max": 3250.0
519
+ },
520
+ {
521
+ "current": 1500.0,
522
+ "min": 1500.0,
523
+ "max": 3250.0
524
+ },
525
+ {
526
+ "current": 1500.0,
527
+ "min": 1500.0,
528
+ "max": 3250.0
529
+ },
530
+ {
531
+ "current": 1500.0,
532
+ "min": 1500.0,
533
+ "max": 3250.0
534
+ },
535
+ {
536
+ "current": 3250.0,
537
+ "min": 1500.0,
538
+ "max": 3250.0
539
+ },
540
+ {
541
+ "current": 3250.0,
542
+ "min": 1500.0,
543
+ "max": 3250.0
544
+ },
545
+ {
546
+ "current": 3250.0,
547
+ "min": 1500.0,
548
+ "max": 3250.0
549
+ },
550
+ {
551
+ "current": 3800.218,
552
+ "min": 1500.0,
553
+ "max": 3250.0
554
+ },
555
+ {
556
+ "current": 3250.0,
557
+ "min": 1500.0,
558
+ "max": 3250.0
559
+ },
560
+ {
561
+ "current": 2300.0,
562
+ "min": 1500.0,
563
+ "max": 3250.0
564
+ },
565
+ {
566
+ "current": 1500.0,
567
+ "min": 1500.0,
568
+ "max": 3250.0
569
+ },
570
+ {
571
+ "current": 2300.0,
572
+ "min": 1500.0,
573
+ "max": 3250.0
574
+ },
575
+ {
576
+ "current": 3250.0,
577
+ "min": 1500.0,
578
+ "max": 3250.0
579
+ },
580
+ {
581
+ "current": 2300.0,
582
+ "min": 1500.0,
583
+ "max": 3250.0
584
+ },
585
+ {
586
+ "current": 1500.0,
587
+ "min": 1500.0,
588
+ "max": 3250.0
589
+ },
590
+ {
591
+ "current": 2300.0,
592
+ "min": 1500.0,
593
+ "max": 3250.0
594
+ },
595
+ {
596
+ "current": 3250.0,
597
+ "min": 1500.0,
598
+ "max": 3250.0
599
+ },
600
+ {
601
+ "current": 2300.0,
602
+ "min": 1500.0,
603
+ "max": 3250.0
604
+ },
605
+ {
606
+ "current": 3250.0,
607
+ "min": 1500.0,
608
+ "max": 3250.0
609
+ },
610
+ {
611
+ "current": 2300.0,
612
+ "min": 1500.0,
613
+ "max": 3250.0
614
+ },
615
+ {
616
+ "current": 1500.0,
617
+ "min": 1500.0,
618
+ "max": 3250.0
619
+ },
620
+ {
621
+ "current": 3250.0,
622
+ "min": 1500.0,
623
+ "max": 3250.0
624
+ },
625
+ {
626
+ "current": 3250.0,
627
+ "min": 1500.0,
628
+ "max": 3250.0
629
+ },
630
+ {
631
+ "current": 3250.0,
632
+ "min": 1500.0,
633
+ "max": 3250.0
634
+ },
635
+ {
636
+ "current": 3250.0,
637
+ "min": 1500.0,
638
+ "max": 3250.0
639
+ },
640
+ {
641
+ "current": 3250.0,
642
+ "min": 1500.0,
643
+ "max": 3250.0
644
+ },
645
+ {
646
+ "current": 3250.0,
647
+ "min": 1500.0,
648
+ "max": 3250.0
649
+ },
650
+ {
651
+ "current": 3250.0,
652
+ "min": 1500.0,
653
+ "max": 3250.0
654
+ },
655
+ {
656
+ "current": 3250.0,
657
+ "min": 1500.0,
658
+ "max": 3250.0
659
+ },
660
+ {
661
+ "current": 3250.0,
662
+ "min": 1500.0,
663
+ "max": 3250.0
664
+ },
665
+ {
666
+ "current": 3250.0,
667
+ "min": 1500.0,
668
+ "max": 3250.0
669
+ },
670
+ {
671
+ "current": 2300.0,
672
+ "min": 1500.0,
673
+ "max": 3250.0
674
+ },
675
+ {
676
+ "current": 3250.0,
677
+ "min": 1500.0,
678
+ "max": 3250.0
679
+ },
680
+ {
681
+ "current": 3250.0,
682
+ "min": 1500.0,
683
+ "max": 3250.0
684
+ },
685
+ {
686
+ "current": 3250.0,
687
+ "min": 1500.0,
688
+ "max": 3250.0
689
+ },
690
+ {
691
+ "current": 1500.0,
692
+ "min": 1500.0,
693
+ "max": 3250.0
694
+ }
695
+ ],
696
+ "disk": {
697
+ "/": {
698
+ "total": 3519.1512603759766,
699
+ "used": 706.6665191650391
700
+ }
701
+ },
702
+ "gpu": "NVIDIA H100 PCIe",
703
+ "gpu_count": 8,
704
+ "gpu_devices": [
705
+ {
706
+ "name": "NVIDIA H100 PCIe",
707
+ "memory_total": 85520809984
708
+ },
709
+ {
710
+ "name": "NVIDIA H100 PCIe",
711
+ "memory_total": 85520809984
712
+ },
713
+ {
714
+ "name": "NVIDIA H100 PCIe",
715
+ "memory_total": 85520809984
716
+ },
717
+ {
718
+ "name": "NVIDIA H100 PCIe",
719
+ "memory_total": 85520809984
720
+ },
721
+ {
722
+ "name": "NVIDIA H100 PCIe",
723
+ "memory_total": 85520809984
724
+ },
725
+ {
726
+ "name": "NVIDIA H100 PCIe",
727
+ "memory_total": 85520809984
728
+ },
729
+ {
730
+ "name": "NVIDIA H100 PCIe",
731
+ "memory_total": 85520809984
732
+ },
733
+ {
734
+ "name": "NVIDIA H100 PCIe",
735
+ "memory_total": 85520809984
736
+ }
737
+ ],
738
+ "memory": {
739
+ "total": 1505.468677520752
740
+ }
741
+ }
emissary-ml/llm-scripts/fine-tuning/llama3/wandb/run-20250811_231120-bt4spvmx/files/wandb-summary.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"train_runtime": 0.0134, "train_samples_per_second": 0.0, "train_steps_per_second": 0.0, "total_flos": 0, "train_loss": 0.0, "train/epoch": 0, "train/global_step": 0, "_timestamp": 1754953912.0067096, "_runtime": 31.708322525024414, "_step": 0, "_wandb": {"runtime": 52}}
emissary-ml/llm-scripts/fine-tuning/llama3/wandb/run-20250811_231120-bt4spvmx/logs/debug.log ADDED
@@ -0,0 +1,34 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ 2025-08-11 23:11:20,296 INFO MainThread:94538 [wandb_setup.py:_flush():76] Current SDK version is 0.16.5
2
+ 2025-08-11 23:11:20,296 INFO MainThread:94538 [wandb_setup.py:_flush():76] Configure stats pid to 94538
3
+ 2025-08-11 23:11:20,296 INFO MainThread:94538 [wandb_setup.py:_flush():76] Loading settings from /root/.config/wandb/settings
4
+ 2025-08-11 23:11:20,296 INFO MainThread:94538 [wandb_setup.py:_flush():76] Loading settings from /home/shadeform/emissary-ml/llm-scripts/fine-tuning/llama3/wandb/settings
5
+ 2025-08-11 23:11:20,296 WARNING MainThread:94538 [wandb_setup.py:_flush():76] Unknown environment variable: WANDB_KEY
6
+ 2025-08-11 23:11:20,296 INFO MainThread:94538 [wandb_setup.py:_flush():76] Loading settings from environment variables: {}
7
+ 2025-08-11 23:11:20,296 INFO MainThread:94538 [wandb_setup.py:_flush():76] Inferring run settings from compute environment: {'program_relpath': 'llm-scripts/fine-tuning/llama3/train.py', 'program_abspath': '/home/shadeform/emissary-ml/llm-scripts/fine-tuning/llama3/train.py', 'program': '/home/shadeform/emissary-ml/llm-scripts/fine-tuning/llama3/train.py'}
8
+ 2025-08-11 23:11:20,296 INFO MainThread:94538 [wandb_setup.py:_flush():76] Applying login settings: {'api_key': '***REDACTED***'}
9
+ 2025-08-11 23:11:20,296 INFO MainThread:94538 [wandb_setup.py:_flush():76] Applying login settings: {'api_key': '***REDACTED***'}
10
+ 2025-08-11 23:11:20,296 INFO MainThread:94538 [wandb_setup.py:_flush():76] Applying login settings: {}
11
+ 2025-08-11 23:11:20,296 INFO MainThread:94538 [wandb_init.py:_log_setup():527] Logging user logs to /home/shadeform/emissary-ml/llm-scripts/fine-tuning/llama3/wandb/run-20250811_231120-bt4spvmx/logs/debug.log
12
+ 2025-08-11 23:11:20,296 INFO MainThread:94538 [wandb_init.py:_log_setup():528] Logging internal logs to /home/shadeform/emissary-ml/llm-scripts/fine-tuning/llama3/wandb/run-20250811_231120-bt4spvmx/logs/debug-internal.log
13
+ 2025-08-11 23:11:20,296 INFO MainThread:94538 [wandb_init.py:init():567] calling init triggers
14
+ 2025-08-11 23:11:20,296 INFO MainThread:94538 [wandb_init.py:init():574] wandb.init called with sweep_config: {}
15
+ config: {}
16
+ 2025-08-11 23:11:20,296 INFO MainThread:94538 [wandb_init.py:init():617] starting backend
17
+ 2025-08-11 23:11:20,296 INFO MainThread:94538 [wandb_init.py:init():621] setting up manager
18
+ 2025-08-11 23:11:20,297 INFO MainThread:94538 [backend.py:_multiprocessing_setup():105] multiprocessing start_methods=fork,spawn,forkserver, using: spawn
19
+ 2025-08-11 23:11:20,298 INFO MainThread:94538 [wandb_init.py:init():629] backend started and connected
20
+ 2025-08-11 23:11:20,299 INFO MainThread:94538 [wandb_init.py:init():721] updated telemetry
21
+ 2025-08-11 23:11:20,302 INFO MainThread:94538 [wandb_init.py:init():754] communicating run to backend with 90.0 second timeout
22
+ 2025-08-11 23:11:20,534 INFO MainThread:94538 [wandb_run.py:_on_init():2344] communicating current version
23
+ 2025-08-11 23:11:20,561 INFO MainThread:94538 [wandb_run.py:_on_init():2353] got version response upgrade_message: "wandb version 0.21.1 is available! To upgrade, please run:\n $ pip install wandb --upgrade"
24
+
25
+ 2025-08-11 23:11:20,561 INFO MainThread:94538 [wandb_init.py:init():805] starting run threads in backend
26
+ 2025-08-11 23:11:21,360 INFO MainThread:94538 [wandb_run.py:_console_start():2323] atexit reg
27
+ 2025-08-11 23:11:21,360 INFO MainThread:94538 [wandb_run.py:_redirect():2178] redirect: wrap_raw
28
+ 2025-08-11 23:11:21,360 INFO MainThread:94538 [wandb_run.py:_redirect():2243] Wrapping output streams.
29
+ 2025-08-11 23:11:21,360 INFO MainThread:94538 [wandb_run.py:_redirect():2268] Redirects installed.
30
+ 2025-08-11 23:11:21,360 INFO MainThread:94538 [wandb_init.py:init():848] run started, returning control to user process
31
+ 2025-08-11 23:11:51,998 INFO MainThread:94538 [wandb_run.py:_config_callback():1347] config_cb None None {'peft_config': {'default': {'task_type': 'CAUSAL_LM', 'peft_type': <PeftType.LORA: 'LORA'>, 'auto_mapping': None, 'base_model_name_or_path': 'meta-llama/Llama-3.1-8B-Instruct', 'revision': None, 'inference_mode': False, 'r': 16, 'target_modules': {'k_proj', 'v_proj', 'gate_proj', 'q_proj', 'down_proj', 'o_proj', 'up_proj'}, 'exclude_modules': None, 'lora_alpha': 64, 'lora_dropout': 0.05, 'fan_in_fan_out': False, 'bias': 'none', 'use_rslora': False, 'modules_to_save': None, 'init_lora_weights': True, 'layers_to_transform': None, 'layers_pattern': None, 'rank_pattern': {}, 'alpha_pattern': {}, 'megatron_config': None, 'megatron_core': 'megatron.core', 'trainable_token_indices': None, 'loftq_config': {}, 'eva_config': None, 'corda_config': None, 'use_dora': False, 'use_qalora': False, 'qalora_group_size': 16, 'layer_replication': None, 'runtime_config': {'ephemeral_gpu_offload': False}, 'lora_bias': False, 'target_parameters': None}}, 'vocab_size': 128257, 'max_position_embeddings': 131072, 'hidden_size': 4096, 'intermediate_size': 14336, 'num_hidden_layers': 32, 'num_attention_heads': 32, 'num_key_value_heads': 8, 'hidden_act': 'silu', 'initializer_range': 0.02, 'rms_norm_eps': 1e-05, 'pretraining_tp': 1, 'use_cache': True, 'rope_theta': 500000.0, 'rope_scaling': {'factor': 8.0, 'low_freq_factor': 1.0, 'high_freq_factor': 4.0, 'original_max_position_embeddings': 8192, 'rope_type': 'llama3'}, 'attention_bias': False, 'attention_dropout': 0.0, 'mlp_bias': False, 'head_dim': 128, 'return_dict': True, 'output_hidden_states': False, 'torchscript': False, 'torch_dtype': 'float16', 'pruned_heads': {}, 'tie_word_embeddings': False, 'chunk_size_feed_forward': 0, 'is_encoder_decoder': False, 'is_decoder': False, 'cross_attention_hidden_size': None, 'add_cross_attention': False, 'tie_encoder_decoder': False, 'architectures': ['LlamaForCausalLM'], 'finetuning_task': None, 
'id2label': {0: 'LABEL_0', 1: 'LABEL_1'}, 'label2id': {'LABEL_0': 0, 'LABEL_1': 1}, 'task_specific_params': None, 'problem_type': None, 'tokenizer_class': None, 'prefix': None, 'bos_token_id': 128000, 'pad_token_id': 128256, 'eos_token_id': [128001, 128008, 128009], 'sep_token_id': None, 'decoder_start_token_id': None, 'max_length': 20, 'min_length': 0, 'do_sample': False, 'early_stopping': False, 'num_beams': 1, 'num_beam_groups': 1, 'diversity_penalty': 0.0, 'temperature': 1.0, 'top_k': 50, 'top_p': 1.0, 'typical_p': 1.0, 'repetition_penalty': 1.0, 'length_penalty': 1.0, 'no_repeat_ngram_size': 0, 'encoder_no_repeat_ngram_size': 0, 'bad_words_ids': None, 'num_return_sequences': 1, 'output_scores': False, 'return_dict_in_generate': False, 'forced_bos_token_id': None, 'forced_eos_token_id': None, 'remove_invalid_values': False, 'exponential_decay_length_penalty': None, 'suppress_tokens': None, 'begin_suppress_tokens': None, '_name_or_path': 'meta-llama/Llama-3.1-8B-Instruct', 'transformers_version': '4.55.0', 'model_type': 'llama', 'tf_legacy_loss': False, 'use_bfloat16': False, 'quantization_config': {'quant_method': 'QuantizationMethod.BITS_AND_BYTES', '_load_in_8bit': True, '_load_in_4bit': False, 'llm_int8_threshold': 6.0, 'llm_int8_skip_modules': None, 'llm_int8_enable_fp32_cpu_offload': False, 'llm_int8_has_fp16_weight': False, 'bnb_4bit_quant_type': 'fp4', 'bnb_4bit_use_double_quant': False, 'bnb_4bit_compute_dtype': 'float32', 'bnb_4bit_quant_storage': 'uint8', 'load_in_4bit': False, 'load_in_8bit': True}, 'output_attentions': False, 'output_dir': 'checkpoints', 'overwrite_output_dir': False, 'do_train': False, 'do_eval': False, 'do_predict': False, 'eval_strategy': 'no', 'prediction_loss_only': False, 'per_device_train_batch_size': 4, 'per_device_eval_batch_size': 8, 'per_gpu_train_batch_size': None, 'per_gpu_eval_batch_size': None, 'gradient_accumulation_steps': 16, 'eval_accumulation_steps': None, 'eval_delay': 0, 'torch_empty_cache_steps': None, 
'learning_rate': 0.0002, 'weight_decay': 0.01, 'adam_beta1': 0.9, 'adam_beta2': 0.999, 'adam_epsilon': 1e-08, 'max_grad_norm': 0.3, 'num_train_epochs': 0, 'max_steps': 0, 'lr_scheduler_type': 'linear', 'lr_scheduler_kwargs': {}, 'warmup_ratio': 0.0, 'warmup_steps': 0, 'log_level': 'passive', 'log_level_replica': 'warning', 'log_on_each_node': True, 'logging_dir': 'checkpoints/runs/Aug11_23-11-50_shadecloud', 'logging_strategy': 'steps', 'logging_first_step': False, 'logging_steps': 10, 'logging_nan_inf_filter': True, 'save_strategy': 'epoch', 'save_steps': 99999, 'save_total_limit': None, 'save_safetensors': True, 'save_on_each_node': False, 'save_only_model': False, 'restore_callback_states_from_checkpoint': False, 'no_cuda': False, 'use_cpu': False, 'use_mps_device': False, 'seed': 3407, 'data_seed': None, 'jit_mode_eval': False, 'use_ipex': False, 'bf16': False, 'fp16': False, 'fp16_opt_level': 'O1', 'half_precision_backend': 'auto', 'bf16_full_eval': False, 'fp16_full_eval': False, 'tf32': None, 'local_rank': 0, 'ddp_backend': None, 'tpu_num_cores': None, 'tpu_metrics_debug': False, 'debug': [], 'dataloader_drop_last': False, 'eval_steps': None, 'dataloader_num_workers': 0, 'dataloader_prefetch_factor': None, 'past_index': -1, 'run_name': None, 'disable_tqdm': False, 'remove_unused_columns': True, 'label_names': None, 'load_best_model_at_end': False, 'metric_for_best_model': None, 'greater_is_better': None, 'ignore_data_skip': False, 'fsdp': [], 'fsdp_min_num_params': 0, 'fsdp_config': {'min_num_params': 0, 'xla': False, 'xla_fsdp_v2': False, 'xla_fsdp_grad_ckpt': False}, 'fsdp_transformer_layer_cls_to_wrap': None, 'accelerator_config': {'split_batches': False, 'dispatch_batches': None, 'even_batches': True, 'use_seedable_sampler': True, 'non_blocking': False, 'gradient_accumulation_kwargs': None}, 'deepspeed': None, 'label_smoothing_factor': 0.0, 'optim': 'paged_adamw_8bit', 'optim_args': None, 'adafactor': False, 'group_by_length': False, 
'length_column_name': 'length', 'report_to': ['wandb'], 'ddp_find_unused_parameters': False, 'ddp_bucket_cap_mb': None, 'ddp_broadcast_buffers': None, 'dataloader_pin_memory': True, 'dataloader_persistent_workers': False, 'skip_memory_metrics': True, 'use_legacy_prediction_loop': False, 'push_to_hub': False, 'resume_from_checkpoint': None, 'hub_model_id': None, 'hub_strategy': 'every_save', 'hub_token': '<HUB_TOKEN>', 'hub_private_repo': None, 'hub_always_push': False, 'hub_revision': None, 'gradient_checkpointing': True, 'gradient_checkpointing_kwargs': None, 'include_inputs_for_metrics': False, 'include_for_metrics': [], 'eval_do_concat_batches': True, 'fp16_backend': 'auto', 'push_to_hub_model_id': None, 'push_to_hub_organization': None, 'push_to_hub_token': '<PUSH_TO_HUB_TOKEN>', 'mp_parameters': '', 'auto_find_batch_size': True, 'full_determinism': False, 'torchdynamo': None, 'ray_scope': 'last', 'ddp_timeout': 1800, 'torch_compile': False, 'torch_compile_backend': None, 'torch_compile_mode': None, 'include_tokens_per_second': False, 'include_num_input_tokens_seen': False, 'neftune_noise_alpha': None, 'optim_target_modules': None, 'batch_eval_metrics': False, 'eval_on_start': False, 'use_liger_kernel': False, 'liger_kernel_config': None, 'eval_use_gather_object': False, 'average_tokens_across_devices': False, 'model_init_kwargs': None, 'use_liger': False, 'dataset_text_field': 'text', 'dataset_kwargs': None, 'dataset_num_proc': None, 'max_seq_length': 1024, 'packing': False, 'eval_packing': None, 'dataset_batch_size': None, 'num_of_sequences': None, 'chars_per_token': '<CHARS_PER_TOKEN>'}
32
+ 2025-08-11 23:11:52,003 INFO MainThread:94538 [wandb_config.py:__setitem__():151] config set model/num_parameters = 8072212480 - <bound method Run._config_callback of <wandb.sdk.wandb_run.Run object at 0x7f62fdeb0610>>
33
+ 2025-08-11 23:11:52,003 INFO MainThread:94538 [wandb_run.py:_config_callback():1347] config_cb model/num_parameters 8072212480 None
34
+ 2025-08-11 23:12:20,167 WARNING MsgRouterThr:94538 [router.py:message_loop():77] message_loop has been closed
emissary-ml/llm-scripts/fine-tuning/llama3/wandb/run-20250811_233312-jyfpuk9c/run-jyfpuk9c.wandb ADDED
Binary file (5.68 kB). View file
 
emissary-ml/llm-scripts/fine-tuning/llama3/wandb/run-20250811_233648-eg3v9sv7/files/config.yaml ADDED
@@ -0,0 +1,46 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ wandb_version: 1
2
+
3
+ _wandb:
4
+ desc: null
5
+ value:
6
+ python_version: 3.10.12
7
+ cli_version: 0.16.5
8
+ framework: huggingface
9
+ huggingface_version: 4.55.0
10
+ is_jupyter_run: false
11
+ is_kaggle_kernel: false
12
+ start_time: 1754955408.0
13
+ t:
14
+ 1:
15
+ - 1
16
+ - 5
17
+ - 11
18
+ - 41
19
+ - 49
20
+ - 51
21
+ - 53
22
+ - 55
23
+ - 71
24
+ - 84
25
+ - 98
26
+ 2:
27
+ - 1
28
+ - 5
29
+ - 11
30
+ - 41
31
+ - 49
32
+ - 51
33
+ - 53
34
+ - 55
35
+ - 71
36
+ - 84
37
+ - 98
38
+ 3:
39
+ - 15
40
+ - 23
41
+ 4: 3.10.12
42
+ 5: 0.16.5
43
+ 6: 4.55.0
44
+ 8:
45
+ - 5
46
+ 13: linux-x86_64
emissary-ml/llm-scripts/fine-tuning/llama3/wandb/run-20250811_233648-eg3v9sv7/files/wandb-summary.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"_wandb": {"runtime": 1}}
emissary-ml/llm-scripts/fine-tuning/llama3/wandb/run-20250811_233648-eg3v9sv7/logs/debug-internal.log ADDED
@@ -0,0 +1,184 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ 2025-08-11 23:36:48,180 INFO StreamThr :95897 [internal.py:wandb_internal():86] W&B internal server running at pid: 95897, started at: 2025-08-11 23:36:48.179572
2
+ 2025-08-11 23:36:48,181 DEBUG HandlerThread:95897 [handler.py:handle_request():146] handle_request: status
3
+ 2025-08-11 23:36:48,182 INFO WriterThread:95897 [datastore.py:open_for_write():87] open: /home/shadeform/emissary-ml/llm-scripts/fine-tuning/llama3/wandb/run-20250811_233648-eg3v9sv7/run-eg3v9sv7.wandb
4
+ 2025-08-11 23:36:48,184 DEBUG SenderThread:95897 [sender.py:send():379] send: header
5
+ 2025-08-11 23:36:48,185 DEBUG SenderThread:95897 [sender.py:send():379] send: run
6
+ 2025-08-11 23:36:48,426 INFO SenderThread:95897 [dir_watcher.py:__init__():211] watching files in: /home/shadeform/emissary-ml/llm-scripts/fine-tuning/llama3/wandb/run-20250811_233648-eg3v9sv7/files
7
+ 2025-08-11 23:36:48,426 INFO SenderThread:95897 [sender.py:_start_run_threads():1124] run started: eg3v9sv7 with start time 1754955408.179257
8
+ 2025-08-11 23:36:48,431 DEBUG HandlerThread:95897 [handler.py:handle_request():146] handle_request: check_version
9
+ 2025-08-11 23:36:48,431 DEBUG SenderThread:95897 [sender.py:send_request():406] send_request: check_version
10
+ 2025-08-11 23:36:48,509 DEBUG HandlerThread:95897 [handler.py:handle_request():146] handle_request: run_start
11
+ 2025-08-11 23:36:49,081 DEBUG HandlerThread:95897 [system_info.py:__init__():26] System info init
12
+ 2025-08-11 23:36:49,081 DEBUG HandlerThread:95897 [system_info.py:__init__():41] System info init done
13
+ 2025-08-11 23:36:49,081 INFO HandlerThread:95897 [system_monitor.py:start():194] Starting system monitor
14
+ 2025-08-11 23:36:49,082 INFO SystemMonitor:95897 [system_monitor.py:_start():158] Starting system asset monitoring threads
15
+ 2025-08-11 23:36:49,082 INFO HandlerThread:95897 [system_monitor.py:probe():214] Collecting system info
16
+ 2025-08-11 23:36:49,082 INFO SystemMonitor:95897 [interfaces.py:start():190] Started cpu monitoring
17
+ 2025-08-11 23:36:49,083 INFO SystemMonitor:95897 [interfaces.py:start():190] Started disk monitoring
18
+ 2025-08-11 23:36:49,084 INFO SystemMonitor:95897 [interfaces.py:start():190] Started gpu monitoring
19
+ 2025-08-11 23:36:49,084 INFO SystemMonitor:95897 [interfaces.py:start():190] Started memory monitoring
20
+ 2025-08-11 23:36:49,085 INFO SystemMonitor:95897 [interfaces.py:start():190] Started network monitoring
21
+ 2025-08-11 23:36:49,142 DEBUG HandlerThread:95897 [system_info.py:probe():150] Probing system
22
+ 2025-08-11 23:36:49,144 DEBUG HandlerThread:95897 [system_info.py:_probe_git():135] Probing git
23
+ 2025-08-11 23:36:49,149 DEBUG HandlerThread:95897 [system_info.py:_probe_git():143] Probing git done
24
+ 2025-08-11 23:36:49,149 DEBUG HandlerThread:95897 [system_info.py:probe():198] Probing system done
25
+ 2025-08-11 23:36:49,149 DEBUG HandlerThread:95897 [system_monitor.py:probe():223] {'os': 'Linux-5.15.0-151-generic-x86_64-with-glibc2.35', 'python': '3.10.12', 'heartbeatAt': '2025-08-11T23:36:49.142476', 'startedAt': '2025-08-11T23:36:48.176106', 'docker': None, 'cuda': None, 'args': ('--dataset_path', '/home/shadeform/tr-5ekuRmvnwgDznEKHAQcBL2-train.jsonl', '--dataset_id', 'ds-9eYnuJhismAkC4AqzDXuVo', '--test_dataset_path', '/home/shadeform/tr-5ekuRmvnwgDznEKHAQcBL2-test.jsonl', '--test_data_id', 'ds-MLF2XiyMxXD4CPsrLwKYAY', '--service_id', 'ms-DbLTHy7dKWzyFzjvLDENkY', '--training_id', 'tr-Mwx5sYhG3PnojUx9dNq3Bn', '--user_id', 'user_2dNEee5lJORqWKAhGHurdhTLvEQ', '--task_type', 'text-generation', '--model_name', 'python-tab-completion-codellama-70b', '--base_model_link', 'emissary-ai/Python-Tab-Completion-CodeLlama-70b', '--is_external', 'false', '--training_technique', 'SFT'), 'state': 'running', 'program': '/home/shadeform/emissary-ml/llm-scripts/fine-tuning/llama3/train.py', 'codePathLocal': 'train.py', 'codePath': 'llm-scripts/fine-tuning/llama3/train.py', 'git': {'remote': 'https://coloryourlife:@github.com/Emissary-Tech/emissary-ml.git', 'commit': '0143ec41bec5a001ce9b65ac366aa9ddd6cdc966'}, 'email': None, 'root': '/home/shadeform/emissary-ml', 'host': 'shadecloud', 'username': 'root', 'executable': '/home/shadeform/emissary-ml/llm-scripts/fine-tuning/llama3/venv/bin/python', 'cpu_count': 64, 'cpu_count_logical': 128, 'cpu_freq': {'current': 2024.2199609375, 'min': 1500.0, 'max': 3250.0}, 'cpu_freq_per_core': [{'current': 1500.0, 'min': 1500.0, 'max': 3250.0}, {'current': 1500.0, 'min': 1500.0, 'max': 3250.0}, {'current': 1500.0, 'min': 1500.0, 'max': 3250.0}, {'current': 1500.0, 'min': 1500.0, 'max': 3250.0}, {'current': 1500.0, 'min': 1500.0, 'max': 3250.0}, {'current': 1500.0, 'min': 1500.0, 'max': 3250.0}, {'current': 1500.0, 'min': 1500.0, 'max': 3250.0}, {'current': 1500.0, 'min': 1500.0, 'max': 3250.0}, {'current': 1500.0, 'min': 1500.0, 'max': 
3250.0}, {'current': 1500.0, 'min': 1500.0, 'max': 3250.0}, {'current': 1500.0, 'min': 1500.0, 'max': 3250.0}, {'current': 1500.0, 'min': 1500.0, 'max': 3250.0}, {'current': 1500.0, 'min': 1500.0, 'max': 3250.0}, {'current': 1500.0, 'min': 1500.0, 'max': 3250.0}, {'current': 1500.0, 'min': 1500.0, 'max': 3250.0}, {'current': 1500.0, 'min': 1500.0, 'max': 3250.0}, {'current': 1500.0, 'min': 1500.0, 'max': 3250.0}, {'current': 1500.0, 'min': 1500.0, 'max': 3250.0}, {'current': 3250.0, 'min': 1500.0, 'max': 3250.0}, {'current': 1500.0, 'min': 1500.0, 'max': 3250.0}, {'current': 1500.0, 'min': 1500.0, 'max': 3250.0}, {'current': 1500.0, 'min': 1500.0, 'max': 3250.0}, {'current': 1500.0, 'min': 1500.0, 'max': 3250.0}, {'current': 1500.0, 'min': 1500.0, 'max': 3250.0}, {'current': 1500.0, 'min': 1500.0, 'max': 3250.0}, {'current': 1500.0, 'min': 1500.0, 'max': 3250.0}, {'current': 1500.0, 'min': 1500.0, 'max': 3250.0}, {'current': 1500.0, 'min': 1500.0, 'max': 3250.0}, {'current': 1500.0, 'min': 1500.0, 'max': 3250.0}, {'current': 3250.0, 'min': 1500.0, 'max': 3250.0}, {'current': 1500.0, 'min': 1500.0, 'max': 3250.0}, {'current': 1500.0, 'min': 1500.0, 'max': 3250.0}, {'current': 1500.0, 'min': 1500.0, 'max': 3250.0}, {'current': 1500.0, 'min': 1500.0, 'max': 3250.0}, {'current': 1500.0, 'min': 1500.0, 'max': 3250.0}, {'current': 2300.0, 'min': 1500.0, 'max': 3250.0}, {'current': 1500.0, 'min': 1500.0, 'max': 3250.0}, {'current': 1500.0, 'min': 1500.0, 'max': 3250.0}, {'current': 1500.0, 'min': 1500.0, 'max': 3250.0}, {'current': 2300.0, 'min': 1500.0, 'max': 3250.0}, {'current': 1500.0, 'min': 1500.0, 'max': 3250.0}, {'current': 1500.0, 'min': 1500.0, 'max': 3250.0}, {'current': 1500.0, 'min': 1500.0, 'max': 3250.0}, {'current': 1500.0, 'min': 1500.0, 'max': 3250.0}, {'current': 1500.0, 'min': 1500.0, 'max': 3250.0}, {'current': 1500.0, 'min': 1500.0, 'max': 3250.0}, {'current': 1500.0, 'min': 1500.0, 'max': 3250.0}, {'current': 2300.0, 'min': 1500.0, 'max': 3250.0}, 
{'current': 3250.0, 'min': 1500.0, 'max': 3250.0}, {'current': 1500.0, 'min': 1500.0, 'max': 3250.0}, {'current': 1500.0, 'min': 1500.0, 'max': 3250.0}, {'current': 2300.0, 'min': 1500.0, 'max': 3250.0}, {'current': 1500.0, 'min': 1500.0, 'max': 3250.0}, {'current': 1500.0, 'min': 1500.0, 'max': 3250.0}, {'current': 3800.214, 'min': 1500.0, 'max': 3250.0}, {'current': 1500.0, 'min': 1500.0, 'max': 3250.0}, {'current': 2300.0, 'min': 1500.0, 'max': 3250.0}, {'current': 1500.0, 'min': 1500.0, 'max': 3250.0}, {'current': 3250.0, 'min': 1500.0, 'max': 3250.0}, {'current': 3250.0, 'min': 1500.0, 'max': 3250.0}, {'current': 1500.0, 'min': 1500.0, 'max': 3250.0}, {'current': 3250.0, 'min': 1500.0, 'max': 3250.0}, {'current': 3250.0, 'min': 1500.0, 'max': 3250.0}, {'current': 1500.0, 'min': 1500.0, 'max': 3250.0}, {'current': 1500.0, 'min': 1500.0, 'max': 3250.0}, {'current': 1500.0, 'min': 1500.0, 'max': 3250.0}, {'current': 3250.0, 'min': 1500.0, 'max': 3250.0}, {'current': 1500.0, 'min': 1500.0, 'max': 3250.0}, {'current': 1500.0, 'min': 1500.0, 'max': 3250.0}, {'current': 1500.0, 'min': 1500.0, 'max': 3250.0}, {'current': 1500.0, 'min': 1500.0, 'max': 3250.0}, {'current': 1500.0, 'min': 1500.0, 'max': 3250.0}, {'current': 1500.0, 'min': 1500.0, 'max': 3250.0}, {'current': 1500.0, 'min': 1500.0, 'max': 3250.0}, {'current': 1500.0, 'min': 1500.0, 'max': 3250.0}, {'current': 1500.0, 'min': 1500.0, 'max': 3250.0}, {'current': 1500.0, 'min': 1500.0, 'max': 3250.0}, {'current': 1500.0, 'min': 1500.0, 'max': 3250.0}, {'current': 1500.0, 'min': 1500.0, 'max': 3250.0}, {'current': 1500.0, 'min': 1500.0, 'max': 3250.0}, {'current': 1500.0, 'min': 1500.0, 'max': 3250.0}, {'current': 1500.0, 'min': 1500.0, 'max': 3250.0}, {'current': 1500.0, 'min': 1500.0, 'max': 3250.0}, {'current': 1500.0, 'min': 1500.0, 'max': 3250.0}, {'current': 1500.0, 'min': 1500.0, 'max': 3250.0}, {'current': 3250.0, 'min': 1500.0, 'max': 3250.0}, {'current': 1500.0, 'min': 1500.0, 'max': 3250.0}, 
{'current': 1500.0, 'min': 1500.0, 'max': 3250.0}, {'current': 1500.0, 'min': 1500.0, 'max': 3250.0}, {'current': 1500.0, 'min': 1500.0, 'max': 3250.0}, {'current': 1500.0, 'min': 1500.0, 'max': 3250.0}, {'current': 1500.0, 'min': 1500.0, 'max': 3250.0}, {'current': 1500.0, 'min': 1500.0, 'max': 3250.0}, {'current': 1500.0, 'min': 1500.0, 'max': 3250.0}, {'current': 1500.0, 'min': 1500.0, 'max': 3250.0}, {'current': 1500.0, 'min': 1500.0, 'max': 3250.0}, {'current': 1500.0, 'min': 1500.0, 'max': 3250.0}, {'current': 3250.0, 'min': 1500.0, 'max': 3250.0}, {'current': 3250.0, 'min': 1500.0, 'max': 3250.0}, {'current': 3250.0, 'min': 1500.0, 'max': 3250.0}, {'current': 1500.0, 'min': 1500.0, 'max': 3250.0}, {'current': 2300.0, 'min': 1500.0, 'max': 3250.0}, {'current': 3250.0, 'min': 1500.0, 'max': 3250.0}, {'current': 3250.0, 'min': 1500.0, 'max': 3250.0}, {'current': 3250.0, 'min': 1500.0, 'max': 3250.0}, {'current': 3250.0, 'min': 1500.0, 'max': 3250.0}, {'current': 3250.0, 'min': 1500.0, 'max': 3250.0}, {'current': 3250.0, 'min': 1500.0, 'max': 3250.0}, {'current': 3250.0, 'min': 1500.0, 'max': 3250.0}, {'current': 3250.0, 'min': 1500.0, 'max': 3250.0}, {'current': 3250.0, 'min': 1500.0, 'max': 3250.0}, {'current': 3250.0, 'min': 1500.0, 'max': 3250.0}, {'current': 3250.0, 'min': 1500.0, 'max': 3250.0}, {'current': 3250.0, 'min': 1500.0, 'max': 3250.0}, {'current': 3250.0, 'min': 1500.0, 'max': 3250.0}, {'current': 2300.0, 'min': 1500.0, 'max': 3250.0}, {'current': 3250.0, 'min': 1500.0, 'max': 3250.0}, {'current': 1500.0, 'min': 1500.0, 'max': 3250.0}, {'current': 1500.0, 'min': 1500.0, 'max': 3250.0}, {'current': 3250.0, 'min': 1500.0, 'max': 3250.0}, {'current': 3250.0, 'min': 1500.0, 'max': 3250.0}, {'current': 3250.0, 'min': 1500.0, 'max': 3250.0}, {'current': 2300.0, 'min': 1500.0, 'max': 3250.0}, {'current': 3250.0, 'min': 1500.0, 'max': 3250.0}, {'current': 2300.0, 'min': 1500.0, 'max': 3250.0}, {'current': 2300.0, 'min': 1500.0, 'max': 3250.0}, 
{'current': 3250.0, 'min': 1500.0, 'max': 3250.0}, {'current': 3250.0, 'min': 1500.0, 'max': 3250.0}], 'disk': {'/': {'total': 3519.1512603759766, 'used': 729.7996559143066}}, 'gpu': 'NVIDIA H100 PCIe', 'gpu_count': 8, 'gpu_devices': [{'name': 'NVIDIA H100 PCIe', 'memory_total': 85520809984}, {'name': 'NVIDIA H100 PCIe', 'memory_total': 85520809984}, {'name': 'NVIDIA H100 PCIe', 'memory_total': 85520809984}, {'name': 'NVIDIA H100 PCIe', 'memory_total': 85520809984}, {'name': 'NVIDIA H100 PCIe', 'memory_total': 85520809984}, {'name': 'NVIDIA H100 PCIe', 'memory_total': 85520809984}, {'name': 'NVIDIA H100 PCIe', 'memory_total': 85520809984}, {'name': 'NVIDIA H100 PCIe', 'memory_total': 85520809984}], 'memory': {'total': 1505.468677520752}}
26
+ 2025-08-11 23:36:49,149 INFO HandlerThread:95897 [system_monitor.py:probe():224] Finished collecting system info
27
+ 2025-08-11 23:36:49,149 INFO HandlerThread:95897 [system_monitor.py:probe():227] Publishing system info
28
+ 2025-08-11 23:36:49,150 INFO HandlerThread:95897 [system_monitor.py:probe():229] Finished publishing system info
29
+ 2025-08-11 23:36:49,152 DEBUG SenderThread:95897 [sender.py:send():379] send: files
30
+ 2025-08-11 23:36:49,152 INFO SenderThread:95897 [sender.py:_save_file():1390] saving file wandb-metadata.json with policy now
31
+ 2025-08-11 23:36:49,292 DEBUG HandlerThread:95897 [handler.py:handle_request():146] handle_request: python_packages
32
+ 2025-08-11 23:36:49,293 DEBUG SenderThread:95897 [sender.py:send_request():406] send_request: python_packages
33
+ 2025-08-11 23:36:49,293 DEBUG HandlerThread:95897 [handler.py:handle_request():146] handle_request: stop_status
34
+ 2025-08-11 23:36:49,294 DEBUG SenderThread:95897 [sender.py:send_request():406] send_request: stop_status
35
+ 2025-08-11 23:36:49,296 DEBUG HandlerThread:95897 [handler.py:handle_request():146] handle_request: internal_messages
36
+ 2025-08-11 23:36:49,410 DEBUG SenderThread:95897 [sender.py:send():379] send: telemetry
37
+ 2025-08-11 23:36:49,424 INFO wandb-upload_0:95897 [upload_job.py:push():131] Uploaded file /tmp/tmpbvz6x99qwandb/p2ok8soc-wandb-metadata.json
38
+ 2025-08-11 23:36:49,427 INFO Thread-12 :95897 [dir_watcher.py:_on_file_created():271] file/dir created: /home/shadeform/emissary-ml/llm-scripts/fine-tuning/llama3/wandb/run-20250811_233648-eg3v9sv7/files/output.log
39
+ 2025-08-11 23:36:49,427 INFO Thread-12 :95897 [dir_watcher.py:_on_file_created():271] file/dir created: /home/shadeform/emissary-ml/llm-scripts/fine-tuning/llama3/wandb/run-20250811_233648-eg3v9sv7/files/requirements.txt
40
+ 2025-08-11 23:36:49,427 INFO Thread-12 :95897 [dir_watcher.py:_on_file_created():271] file/dir created: /home/shadeform/emissary-ml/llm-scripts/fine-tuning/llama3/wandb/run-20250811_233648-eg3v9sv7/files/wandb-metadata.json
41
+ 2025-08-11 23:36:50,267 DEBUG SenderThread:95897 [sender.py:send():379] send: exit
42
+ 2025-08-11 23:36:50,267 INFO SenderThread:95897 [sender.py:send_exit():586] handling exit code: 0
43
+ 2025-08-11 23:36:50,267 INFO SenderThread:95897 [sender.py:send_exit():588] handling runtime: 1
44
+ 2025-08-11 23:36:50,267 INFO SenderThread:95897 [sender.py:_save_file():1390] saving file wandb-summary.json with policy end
45
+ 2025-08-11 23:36:50,267 INFO SenderThread:95897 [sender.py:send_exit():594] send defer
46
+ 2025-08-11 23:36:50,267 DEBUG HandlerThread:95897 [handler.py:handle_request():146] handle_request: defer
47
+ 2025-08-11 23:36:50,267 INFO HandlerThread:95897 [handler.py:handle_request_defer():172] handle defer: 0
48
+ 2025-08-11 23:36:50,268 DEBUG SenderThread:95897 [sender.py:send_request():406] send_request: defer
49
+ 2025-08-11 23:36:50,268 INFO SenderThread:95897 [sender.py:send_request_defer():610] handle sender defer: 0
50
+ 2025-08-11 23:36:50,268 INFO SenderThread:95897 [sender.py:transition_state():614] send defer: 1
51
+ 2025-08-11 23:36:50,268 DEBUG HandlerThread:95897 [handler.py:handle_request():146] handle_request: defer
52
+ 2025-08-11 23:36:50,268 INFO HandlerThread:95897 [handler.py:handle_request_defer():172] handle defer: 1
53
+ 2025-08-11 23:36:50,268 DEBUG SenderThread:95897 [sender.py:send_request():406] send_request: defer
54
+ 2025-08-11 23:36:50,268 INFO SenderThread:95897 [sender.py:send_request_defer():610] handle sender defer: 1
55
+ 2025-08-11 23:36:50,268 INFO SenderThread:95897 [sender.py:transition_state():614] send defer: 2
56
+ 2025-08-11 23:36:50,268 DEBUG HandlerThread:95897 [handler.py:handle_request():146] handle_request: defer
57
+ 2025-08-11 23:36:50,268 INFO HandlerThread:95897 [handler.py:handle_request_defer():172] handle defer: 2
58
+ 2025-08-11 23:36:50,268 INFO HandlerThread:95897 [system_monitor.py:finish():203] Stopping system monitor
59
+ 2025-08-11 23:36:50,268 DEBUG SystemMonitor:95897 [system_monitor.py:_start():172] Starting system metrics aggregation loop
60
+ 2025-08-11 23:36:50,269 DEBUG SystemMonitor:95897 [system_monitor.py:_start():179] Finished system metrics aggregation loop
61
+ 2025-08-11 23:36:50,269 DEBUG SystemMonitor:95897 [system_monitor.py:_start():183] Publishing last batch of metrics
62
+ 2025-08-11 23:36:50,269 INFO HandlerThread:95897 [interfaces.py:finish():202] Joined cpu monitor
63
+ 2025-08-11 23:36:50,270 INFO HandlerThread:95897 [interfaces.py:finish():202] Joined disk monitor
64
+ 2025-08-11 23:36:50,427 INFO Thread-12 :95897 [dir_watcher.py:_on_file_created():271] file/dir created: /home/shadeform/emissary-ml/llm-scripts/fine-tuning/llama3/wandb/run-20250811_233648-eg3v9sv7/files/wandb-summary.json
65
+ 2025-08-11 23:36:51,428 INFO Thread-12 :95897 [dir_watcher.py:_on_file_modified():288] file/dir modified: /home/shadeform/emissary-ml/llm-scripts/fine-tuning/llama3/wandb/run-20250811_233648-eg3v9sv7/files/output.log
66
+ 2025-08-11 23:36:51,457 INFO HandlerThread:95897 [interfaces.py:finish():202] Joined gpu monitor
67
+ 2025-08-11 23:36:51,457 INFO HandlerThread:95897 [interfaces.py:finish():202] Joined memory monitor
68
+ 2025-08-11 23:36:51,457 INFO HandlerThread:95897 [interfaces.py:finish():202] Joined network monitor
69
+ 2025-08-11 23:36:51,458 DEBUG HandlerThread:95897 [handler.py:handle_request():146] handle_request: poll_exit
70
+ 2025-08-11 23:36:51,459 DEBUG SenderThread:95897 [sender.py:send_request():406] send_request: defer
71
+ 2025-08-11 23:36:51,459 INFO SenderThread:95897 [sender.py:send_request_defer():610] handle sender defer: 2
72
+ 2025-08-11 23:36:51,459 INFO SenderThread:95897 [sender.py:transition_state():614] send defer: 3
73
+ 2025-08-11 23:36:51,459 DEBUG SenderThread:95897 [sender.py:send():379] send: stats
74
+ 2025-08-11 23:36:51,459 DEBUG SenderThread:95897 [sender.py:send_request():406] send_request: poll_exit
75
+ 2025-08-11 23:36:51,460 DEBUG HandlerThread:95897 [handler.py:handle_request():146] handle_request: defer
76
+ 2025-08-11 23:36:51,460 INFO HandlerThread:95897 [handler.py:handle_request_defer():172] handle defer: 3
77
+ 2025-08-11 23:36:51,460 DEBUG SenderThread:95897 [sender.py:send_request():406] send_request: defer
78
+ 2025-08-11 23:36:51,461 INFO SenderThread:95897 [sender.py:send_request_defer():610] handle sender defer: 3
79
+ 2025-08-11 23:36:51,461 INFO SenderThread:95897 [sender.py:transition_state():614] send defer: 4
80
+ 2025-08-11 23:36:51,461 DEBUG HandlerThread:95897 [handler.py:handle_request():146] handle_request: defer
81
+ 2025-08-11 23:36:51,461 INFO HandlerThread:95897 [handler.py:handle_request_defer():172] handle defer: 4
82
+ 2025-08-11 23:36:51,461 DEBUG SenderThread:95897 [sender.py:send_request():406] send_request: defer
83
+ 2025-08-11 23:36:51,461 INFO SenderThread:95897 [sender.py:send_request_defer():610] handle sender defer: 4
84
+ 2025-08-11 23:36:51,461 INFO SenderThread:95897 [sender.py:transition_state():614] send defer: 5
85
+ 2025-08-11 23:36:51,462 DEBUG HandlerThread:95897 [handler.py:handle_request():146] handle_request: defer
86
+ 2025-08-11 23:36:51,462 INFO HandlerThread:95897 [handler.py:handle_request_defer():172] handle defer: 5
87
+ 2025-08-11 23:36:51,462 DEBUG SenderThread:95897 [sender.py:send():379] send: summary
88
+ 2025-08-11 23:36:51,463 INFO SenderThread:95897 [sender.py:_save_file():1390] saving file wandb-summary.json with policy end
89
+ 2025-08-11 23:36:51,463 DEBUG SenderThread:95897 [sender.py:send_request():406] send_request: defer
90
+ 2025-08-11 23:36:51,463 INFO SenderThread:95897 [sender.py:send_request_defer():610] handle sender defer: 5
91
+ 2025-08-11 23:36:51,463 INFO SenderThread:95897 [sender.py:transition_state():614] send defer: 6
92
+ 2025-08-11 23:36:51,463 DEBUG HandlerThread:95897 [handler.py:handle_request():146] handle_request: defer
93
+ 2025-08-11 23:36:51,464 INFO HandlerThread:95897 [handler.py:handle_request_defer():172] handle defer: 6
94
+ 2025-08-11 23:36:51,464 DEBUG SenderThread:95897 [sender.py:send_request():406] send_request: defer
95
+ 2025-08-11 23:36:51,464 INFO SenderThread:95897 [sender.py:send_request_defer():610] handle sender defer: 6
96
+ 2025-08-11 23:36:51,469 DEBUG HandlerThread:95897 [handler.py:handle_request():146] handle_request: status_report
97
+ 2025-08-11 23:36:51,540 INFO SenderThread:95897 [sender.py:transition_state():614] send defer: 7
98
+ 2025-08-11 23:36:51,541 DEBUG HandlerThread:95897 [handler.py:handle_request():146] handle_request: defer
99
+ 2025-08-11 23:36:51,541 INFO HandlerThread:95897 [handler.py:handle_request_defer():172] handle defer: 7
100
+ 2025-08-11 23:36:51,541 DEBUG SenderThread:95897 [sender.py:send_request():406] send_request: defer
101
+ 2025-08-11 23:36:51,541 INFO SenderThread:95897 [sender.py:send_request_defer():610] handle sender defer: 7
102
+ 2025-08-11 23:36:52,268 DEBUG HandlerThread:95897 [handler.py:handle_request():146] handle_request: poll_exit
103
+ 2025-08-11 23:36:52,428 INFO Thread-12 :95897 [dir_watcher.py:_on_file_modified():288] file/dir modified: /home/shadeform/emissary-ml/llm-scripts/fine-tuning/llama3/wandb/run-20250811_233648-eg3v9sv7/files/output.log
104
+ 2025-08-11 23:36:52,429 INFO Thread-12 :95897 [dir_watcher.py:_on_file_modified():288] file/dir modified: /home/shadeform/emissary-ml/llm-scripts/fine-tuning/llama3/wandb/run-20250811_233648-eg3v9sv7/files/config.yaml
105
+ 2025-08-11 23:36:52,429 INFO Thread-12 :95897 [dir_watcher.py:_on_file_modified():288] file/dir modified: /home/shadeform/emissary-ml/llm-scripts/fine-tuning/llama3/wandb/run-20250811_233648-eg3v9sv7/files/wandb-summary.json
106
+ 2025-08-11 23:36:54,031 INFO SenderThread:95897 [sender.py:transition_state():614] send defer: 8
107
+ 2025-08-11 23:36:54,031 DEBUG SenderThread:95897 [sender.py:send_request():406] send_request: poll_exit
108
+ 2025-08-11 23:36:54,032 DEBUG HandlerThread:95897 [handler.py:handle_request():146] handle_request: defer
109
+ 2025-08-11 23:36:54,032 INFO HandlerThread:95897 [handler.py:handle_request_defer():172] handle defer: 8
110
+ 2025-08-11 23:36:54,033 DEBUG SenderThread:95897 [sender.py:send_request():406] send_request: defer
111
+ 2025-08-11 23:36:54,033 INFO SenderThread:95897 [sender.py:send_request_defer():610] handle sender defer: 8
112
+ 2025-08-11 23:36:54,033 INFO SenderThread:95897 [job_builder.py:build():318] Attempting to build job artifact
113
+ 2025-08-11 23:36:54,033 INFO SenderThread:95897 [job_builder.py:_get_source_type():455] is repo sourced job
114
+ 2025-08-11 23:36:54,060 INFO SenderThread:95897 [job_builder.py:build():431] adding wandb-job metadata file
115
+ 2025-08-11 23:36:54,063 INFO SenderThread:95897 [sender.py:transition_state():614] send defer: 9
116
+ 2025-08-11 23:36:54,064 DEBUG HandlerThread:95897 [handler.py:handle_request():146] handle_request: defer
117
+ 2025-08-11 23:36:54,064 DEBUG SenderThread:95897 [sender.py:send():379] send: artifact
118
+ 2025-08-11 23:36:54,064 INFO HandlerThread:95897 [handler.py:handle_request_defer():172] handle defer: 9
119
+ 2025-08-11 23:36:54,271 DEBUG HandlerThread:95897 [handler.py:handle_request():146] handle_request: poll_exit
120
+ 2025-08-11 23:36:54,350 INFO SenderThread:95897 [sender.py:send_artifact():1468] sent artifact job-https___coloryourlife__github.com_Emissary-Tech_emissary-ml.git_llm-scripts_fine-tuning_llama3_train.py - {'id': 'QXJ0aWZhY3Q6MTk0ODg5MzA0Nw==', 'state': 'COMMITTED', 'artifactSequence': {'id': 'QXJ0aWZhY3RDb2xsZWN0aW9uOjcxMTAwMjM0OQ==', 'latestArtifact': {'id': 'QXJ0aWZhY3Q6MTk0ODg5MzA0Nw==', 'versionIndex': 18}}}
121
+ 2025-08-11 23:36:54,350 DEBUG SenderThread:95897 [sender.py:send_request():406] send_request: defer
122
+ 2025-08-11 23:36:54,350 INFO SenderThread:95897 [sender.py:send_request_defer():610] handle sender defer: 9
123
+ 2025-08-11 23:36:54,350 INFO SenderThread:95897 [dir_watcher.py:finish():358] shutting down directory watcher
124
+ 2025-08-11 23:36:54,430 INFO Thread-12 :95897 [dir_watcher.py:_on_file_modified():288] file/dir modified: /home/shadeform/emissary-ml/llm-scripts/fine-tuning/llama3/wandb/run-20250811_233648-eg3v9sv7/files/output.log
125
+ 2025-08-11 23:36:54,431 INFO SenderThread:95897 [dir_watcher.py:finish():388] scan: /home/shadeform/emissary-ml/llm-scripts/fine-tuning/llama3/wandb/run-20250811_233648-eg3v9sv7/files
126
+ 2025-08-11 23:36:54,431 INFO SenderThread:95897 [dir_watcher.py:finish():402] scan save: /home/shadeform/emissary-ml/llm-scripts/fine-tuning/llama3/wandb/run-20250811_233648-eg3v9sv7/files/output.log output.log
127
+ 2025-08-11 23:36:54,431 INFO SenderThread:95897 [dir_watcher.py:finish():402] scan save: /home/shadeform/emissary-ml/llm-scripts/fine-tuning/llama3/wandb/run-20250811_233648-eg3v9sv7/files/wandb-metadata.json wandb-metadata.json
128
+ 2025-08-11 23:36:54,431 INFO SenderThread:95897 [dir_watcher.py:finish():402] scan save: /home/shadeform/emissary-ml/llm-scripts/fine-tuning/llama3/wandb/run-20250811_233648-eg3v9sv7/files/config.yaml config.yaml
129
+ 2025-08-11 23:36:54,432 INFO SenderThread:95897 [dir_watcher.py:finish():402] scan save: /home/shadeform/emissary-ml/llm-scripts/fine-tuning/llama3/wandb/run-20250811_233648-eg3v9sv7/files/requirements.txt requirements.txt
130
+ 2025-08-11 23:36:54,434 INFO SenderThread:95897 [dir_watcher.py:finish():402] scan save: /home/shadeform/emissary-ml/llm-scripts/fine-tuning/llama3/wandb/run-20250811_233648-eg3v9sv7/files/wandb-summary.json wandb-summary.json
131
+ 2025-08-11 23:36:54,438 INFO SenderThread:95897 [sender.py:transition_state():614] send defer: 10
132
+ 2025-08-11 23:36:54,438 DEBUG SenderThread:95897 [sender.py:send_request():406] send_request: poll_exit
133
+ 2025-08-11 23:36:54,441 DEBUG HandlerThread:95897 [handler.py:handle_request():146] handle_request: defer
134
+ 2025-08-11 23:36:54,441 INFO HandlerThread:95897 [handler.py:handle_request_defer():172] handle defer: 10
135
+ 2025-08-11 23:36:54,444 DEBUG SenderThread:95897 [sender.py:send_request():406] send_request: defer
136
+ 2025-08-11 23:36:54,444 INFO SenderThread:95897 [sender.py:send_request_defer():610] handle sender defer: 10
137
+ 2025-08-11 23:36:54,444 INFO SenderThread:95897 [file_pusher.py:finish():172] shutting down file pusher
138
+ 2025-08-11 23:36:54,622 INFO wandb-upload_0:95897 [upload_job.py:push():131] Uploaded file /home/shadeform/emissary-ml/llm-scripts/fine-tuning/llama3/wandb/run-20250811_233648-eg3v9sv7/files/output.log
139
+ 2025-08-11 23:36:54,640 INFO wandb-upload_1:95897 [upload_job.py:push():131] Uploaded file /home/shadeform/emissary-ml/llm-scripts/fine-tuning/llama3/wandb/run-20250811_233648-eg3v9sv7/files/config.yaml
140
+ 2025-08-11 23:36:54,650 INFO wandb-upload_2:95897 [upload_job.py:push():131] Uploaded file /home/shadeform/emissary-ml/llm-scripts/fine-tuning/llama3/wandb/run-20250811_233648-eg3v9sv7/files/requirements.txt
141
+ 2025-08-11 23:36:54,667 INFO wandb-upload_3:95897 [upload_job.py:push():131] Uploaded file /home/shadeform/emissary-ml/llm-scripts/fine-tuning/llama3/wandb/run-20250811_233648-eg3v9sv7/files/wandb-summary.json
142
+ 2025-08-11 23:36:54,867 INFO Thread-11 (_thread_body):95897 [sender.py:transition_state():614] send defer: 11
143
+ 2025-08-11 23:36:54,868 DEBUG HandlerThread:95897 [handler.py:handle_request():146] handle_request: defer
144
+ 2025-08-11 23:36:54,868 INFO HandlerThread:95897 [handler.py:handle_request_defer():172] handle defer: 11
145
+ 2025-08-11 23:36:54,869 DEBUG SenderThread:95897 [sender.py:send_request():406] send_request: defer
146
+ 2025-08-11 23:36:54,869 INFO SenderThread:95897 [sender.py:send_request_defer():610] handle sender defer: 11
147
+ 2025-08-11 23:36:54,869 INFO SenderThread:95897 [file_pusher.py:join():178] waiting for file pusher
148
+ 2025-08-11 23:36:54,869 INFO SenderThread:95897 [sender.py:transition_state():614] send defer: 12
149
+ 2025-08-11 23:36:54,870 DEBUG HandlerThread:95897 [handler.py:handle_request():146] handle_request: defer
150
+ 2025-08-11 23:36:54,870 INFO HandlerThread:95897 [handler.py:handle_request_defer():172] handle defer: 12
151
+ 2025-08-11 23:36:54,870 DEBUG SenderThread:95897 [sender.py:send_request():406] send_request: defer
152
+ 2025-08-11 23:36:54,870 INFO SenderThread:95897 [sender.py:send_request_defer():610] handle sender defer: 12
153
+ 2025-08-11 23:36:54,870 INFO SenderThread:95897 [file_stream.py:finish():614] file stream finish called
154
+ 2025-08-11 23:36:54,948 INFO SenderThread:95897 [file_stream.py:finish():618] file stream finish is done
155
+ 2025-08-11 23:36:54,948 INFO SenderThread:95897 [sender.py:transition_state():614] send defer: 13
156
+ 2025-08-11 23:36:54,948 DEBUG HandlerThread:95897 [handler.py:handle_request():146] handle_request: defer
157
+ 2025-08-11 23:36:54,948 INFO HandlerThread:95897 [handler.py:handle_request_defer():172] handle defer: 13
158
+ 2025-08-11 23:36:54,949 DEBUG SenderThread:95897 [sender.py:send_request():406] send_request: defer
159
+ 2025-08-11 23:36:54,949 INFO SenderThread:95897 [sender.py:send_request_defer():610] handle sender defer: 13
160
+ 2025-08-11 23:36:54,949 INFO SenderThread:95897 [sender.py:transition_state():614] send defer: 14
161
+ 2025-08-11 23:36:54,949 DEBUG HandlerThread:95897 [handler.py:handle_request():146] handle_request: defer
162
+ 2025-08-11 23:36:54,950 INFO HandlerThread:95897 [handler.py:handle_request_defer():172] handle defer: 14
163
+ 2025-08-11 23:36:54,950 DEBUG SenderThread:95897 [sender.py:send():379] send: final
164
+ 2025-08-11 23:36:54,950 DEBUG SenderThread:95897 [sender.py:send():379] send: footer
165
+ 2025-08-11 23:36:54,950 DEBUG SenderThread:95897 [sender.py:send_request():406] send_request: defer
166
+ 2025-08-11 23:36:54,950 INFO SenderThread:95897 [sender.py:send_request_defer():610] handle sender defer: 14
167
+ 2025-08-11 23:36:54,951 DEBUG HandlerThread:95897 [handler.py:handle_request():146] handle_request: poll_exit
168
+ 2025-08-11 23:36:54,951 DEBUG SenderThread:95897 [sender.py:send_request():406] send_request: poll_exit
169
+ 2025-08-11 23:36:54,952 DEBUG HandlerThread:95897 [handler.py:handle_request():146] handle_request: poll_exit
170
+ 2025-08-11 23:36:54,952 DEBUG SenderThread:95897 [sender.py:send_request():406] send_request: poll_exit
171
+ 2025-08-11 23:36:54,953 DEBUG HandlerThread:95897 [handler.py:handle_request():146] handle_request: server_info
172
+ 2025-08-11 23:36:54,953 DEBUG SenderThread:95897 [sender.py:send_request():406] send_request: server_info
173
+ 2025-08-11 23:36:54,956 DEBUG HandlerThread:95897 [handler.py:handle_request():146] handle_request: get_summary
174
+ 2025-08-11 23:36:54,956 DEBUG HandlerThread:95897 [handler.py:handle_request():146] handle_request: sampled_history
175
+ 2025-08-11 23:36:54,957 DEBUG HandlerThread:95897 [handler.py:handle_request():146] handle_request: internal_messages
176
+ 2025-08-11 23:36:55,000 INFO MainThread:95897 [wandb_run.py:_footer_history_summary_info():3920] rendering history
177
+ 2025-08-11 23:36:55,000 INFO MainThread:95897 [wandb_run.py:_footer_history_summary_info():3952] rendering summary
178
+ 2025-08-11 23:36:55,000 INFO MainThread:95897 [wandb_run.py:_footer_sync_info():3879] logging synced files
179
+ 2025-08-11 23:36:55,001 DEBUG HandlerThread:95897 [handler.py:handle_request():146] handle_request: shutdown
180
+ 2025-08-11 23:36:55,001 INFO HandlerThread:95897 [handler.py:finish():866] shutting down handler
181
+ 2025-08-11 23:36:55,953 INFO WriterThread:95897 [datastore.py:close():296] close: /home/shadeform/emissary-ml/llm-scripts/fine-tuning/llama3/wandb/run-20250811_233648-eg3v9sv7/run-eg3v9sv7.wandb
182
+ 2025-08-11 23:36:56,000 INFO SenderThread:95897 [sender.py:finish():1546] shutting down sender
183
+ 2025-08-11 23:36:56,000 INFO SenderThread:95897 [file_pusher.py:finish():172] shutting down file pusher
184
+ 2025-08-11 23:36:56,000 INFO SenderThread:95897 [file_pusher.py:join():178] waiting for file pusher