Minor Fixes for GPU training

This commit is contained in:
Clemens-Dautermann 2020-01-28 15:23:25 +01:00
parent 56ee2635b5
commit 459caccfe2
47 changed files with 9862 additions and 26 deletions

View file

@ -0,0 +1,9 @@
wandb_version: 1
_wandb:
  desc: null
  value:
    cli_version: 0.8.22
    framework: torch
    is_jupyter_run: false
    python_version: 3.6.9

File diff suppressed because one or more lines are too long

View file

@ -0,0 +1,6 @@
{"system.gpu.0.gpu": 0.13, "system.gpu.0.memory": 0.47, "system.gpu.0.memoryAllocated": 9.46, "system.gpu.0.temp": 36.47, "system.gpu.0.powerWatts": 23.7, "system.gpu.0.powerPercent": 13.17, "system.cpu": 19.22, "system.memory": 24.46, "system.disk": 4.8, "system.proc.memory.availableMB": 6038.16, "system.proc.memory.rssMB": 1338.85, "system.proc.memory.percent": 16.75, "system.proc.cpu.threads": 4.67, "system.network.sent": 44593, "system.network.recv": 74352, "_wandb": true, "_timestamp": 1580219360, "_runtime": 29}
{"system.gpu.0.gpu": 0.0, "system.gpu.0.memory": 2.93, "system.gpu.0.memoryAllocated": 11.54, "system.gpu.0.temp": 36.07, "system.gpu.0.powerWatts": 10.74, "system.gpu.0.powerPercent": 5.97, "system.cpu": 25.42, "system.memory": 28.08, "system.disk": 4.8, "system.proc.memory.availableMB": 5748.53, "system.proc.memory.rssMB": 1672.29, "system.proc.memory.percent": 20.92, "system.proc.cpu.threads": 5.0, "system.network.sent": 117452, "system.network.recv": 102403, "_wandb": true, "_timestamp": 1580219390, "_runtime": 59}
{"system.gpu.0.gpu": 0.0, "system.gpu.0.memory": 3.0, "system.gpu.0.memoryAllocated": 11.54, "system.gpu.0.temp": 36.0, "system.gpu.0.powerWatts": 10.73, "system.gpu.0.powerPercent": 5.96, "system.cpu": 25.37, "system.memory": 28.18, "system.disk": 4.8, "system.proc.memory.availableMB": 5740.19, "system.proc.memory.rssMB": 1680.61, "system.proc.memory.percent": 21.03, "system.proc.cpu.threads": 5.0, "system.network.sent": 194239, "system.network.recv": 133076, "_wandb": true, "_timestamp": 1580219420, "_runtime": 89}
{"system.gpu.0.gpu": 0.0, "system.gpu.0.memory": 3.0, "system.gpu.0.memoryAllocated": 11.54, "system.gpu.0.temp": 36.0, "system.gpu.0.powerWatts": 10.71, "system.gpu.0.powerPercent": 5.95, "system.cpu": 25.38, "system.memory": 28.29, "system.disk": 4.8, "system.proc.memory.availableMB": 5731.83, "system.proc.memory.rssMB": 1688.87, "system.proc.memory.percent": 21.13, "system.proc.cpu.threads": 5.0, "system.network.sent": 276894, "system.network.recv": 159761, "_wandb": true, "_timestamp": 1580219450, "_runtime": 119}
{"system.gpu.0.gpu": 0.0, "system.gpu.0.memory": 3.0, "system.gpu.0.memoryAllocated": 11.54, "system.gpu.0.temp": 36.0, "system.gpu.0.powerWatts": 10.7, "system.gpu.0.powerPercent": 5.95, "system.cpu": 25.45, "system.memory": 28.39, "system.disk": 4.8, "system.proc.memory.availableMB": 5723.41, "system.proc.memory.rssMB": 1697.12, "system.proc.memory.percent": 21.23, "system.proc.cpu.threads": 5.0, "system.network.sent": 366397, "system.network.recv": 193956, "_wandb": true, "_timestamp": 1580219480, "_runtime": 149}
{"system.gpu.0.gpu": 0.0, "system.gpu.0.memory": 3.0, "system.gpu.0.memoryAllocated": 11.54, "system.gpu.0.temp": 36.0, "system.gpu.0.powerWatts": 10.74, "system.gpu.0.powerPercent": 5.97, "system.cpu": 23.1, "system.memory": 28.45, "system.disk": 4.8, "system.proc.memory.availableMB": 5718.97, "system.proc.memory.rssMB": 1701.61, "system.proc.memory.percent": 21.29, "system.proc.cpu.threads": 5.0, "system.network.sent": 374068, "system.network.recv": 196093, "_wandb": true, "_timestamp": 1580219483, "_runtime": 152}

View file

@ -0,0 +1,25 @@
{
"root": "/home/clemens/Dokumente/repos/pytorch-ai",
"program": "pytorch_ai.py",
"git": {
"remote": "git@github.com:Clemens-Dautermann/pytorch-ai.git",
"commit": "56ee2635b5fec0a3976a4e7ddc55a89d4dea93bc"
},
"email": "clemens.dautermann@t-online.de",
"startedAt": "2020-01-28T13:48:51.143809",
"host": "clemens-ubuntu",
"username": "clemens",
"executable": "/usr/bin/python3",
"os": "Linux-4.15.0-58-generic-x86_64-with-Ubuntu-18.04-bionic",
"python": "3.6.9",
"gpu": "GeForce GTX 960",
"gpu_count": 1,
"cpu_count": 4,
"args": [],
"state": "killed",
"jobType": null,
"mode": "dryrun",
"project": "tictactoe",
"heartbeatAt": "2020-01-28T13:51:24.194431",
"exitcode": 255
}