-
Notifications
You must be signed in to change notification settings - Fork 21
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
Merge pull request #215 from InnopolisUni/system_monitoring
System monitoring
- Loading branch information
Showing
18 changed files
with
482 additions
and
20 deletions.
There are no files selected for viewing
File renamed without changes.
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
21 changes: 21 additions & 0 deletions
21
config/experiments/semantic-segmentation/KG_041223_ingieq921_unet.yaml
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,21 @@ | ||
# @package _global_ | ||
# Experiment config for a semantic-segmentation run. The defaults list below
# overrides four config groups: models, datasets, optimizers and losses.
# NOTE(review): the nesting of the keys below is not visible in this rendering;
# confirm the indentation against the real file before relying on it.
defaults: | ||
- override /models: semantic-segmentation/unet_smp.yaml | ||
- override /datasets: semantic-segmentation/segmentation_arable.yaml | ||
- override /optimizers: adam.yaml | ||
- override /losses: segmentation_losses | ||
|
||
# Trainer options. | ||
trainers: | ||
overfit_batches: 20 # fit only 20 val batches and 40 train batches | ||
|
||
# Device type requested for the run.
accelerator: gpu | ||
|
||
# Model options: the model is configured with 4 input channels.
models: | ||
in_channels: 4 | ||
|
||
|
||
# Run-level settings: project/task labels, RNG seed, weights_freq and batch size.
# NOTE(review): weights_freq presumably controls how often weights are saved - confirm.
project: "segmentation" | ||
task: "image-segmentation" | ||
random_seed: 42 | ||
weights_freq: 1 | ||
batch_size: 10 |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,39 @@ | ||
#!/bin/bash
# Launches the anomaly-detection LSTM training run in the background and, once
# per second for as long as that job is alive, appends:
#   cpu_log        - the 'Cpu' lines of a top snapshot
#   mem_log        - the 'MiB Mem' lines of the same snapshot
#   nvidiasmi_log  - nvidia-smi CSV rows matching GPU_BUS_ID
# When the job ends, examples/measurements_compaction.py is executed
# (presumably to post-process the logs - confirm).
#
# run like this (substitute this script's own path):
#   sudo -E env "PATH=$PATH" bash examples/<this_script>.sh
#
# Environment:
#   GPU_BUS_ID  PCI bus id used to select rows of nvidia-smi output
#               (default: 00000000:25:00.0)

GPU_BUS_ID=${GPU_BUS_ID:-00000000:25:00.0}

# iotop is not invoked below; it is kept as a dependency but only installed
# when it is actually missing, instead of calling apt-get on every run.
if ! command -v iotop > /dev/null; then
  sudo apt-get install -y iotop > /dev/null
fi

# train.py and examples/ are addressed relative to the parent of examples/,
# so step up when the script was started from inside examples/.
if [ "${PWD##*/}" = "examples" ]; then
  cd .. || exit 1
fi

# Start every run with fresh output files.
echo "" > nohup.out
echo "" > nvidiasmi_log
echo "" > mem_log
echo "" > cpu_log

export NO_CLI=True

nohup time sudo -E env "PATH=$PATH" python train.py \
  experiments=anomaly-detection/IM_040822_rbe23lls_anomaly_detection_timeseries_lstm.yaml \
  epochs=100 optimizers=adam accelerator=gpu &
PID=$!
echo "Saving cpu+ram info and nvidia-smi to cpu_log + mem_log and nvidiasmi_log"
echo "$PID"

# Poll the background job itself rather than counting `lsof nohup.out` rows:
# the lsof count can still be zero right after launch (ending the loop before
# it starts) and nohup only writes nohup.out when stdout is a terminal.
while kill -0 "$PID" 2> /dev/null; do
  # One top snapshot feeds both logs so CPU and memory share a sample time.
  top_snapshot=$(top -b -n 1)
  grep -E 'Cpu' <<< "$top_snapshot" >> cpu_log
  grep -E 'MiB Mem' <<< "$top_snapshot" >> mem_log
  # -F: the bus id is a literal string, not a regular expression.
  sudo nvidia-smi --query-gpu=timestamp,name,pci.bus_id,driver_version,pstate,pcie.link.gen.max,pcie.link.gen.current,temperature.gpu,utilization.gpu,utilization.memory,memory.total,memory.free,memory.used --format=csv \
    | grep -F -- "$GPU_BUS_ID" >> nvidiasmi_log
  sleep 1
done

# The job has already exited here, so collect its status instead of sending
# SIGKILL to a PID that may have been reused by an unrelated process.
if ! wait "$PID"; then
  echo "warning: monitored command exited with a non-zero status" >&2
fi

sudo -E env "PATH=$PATH" python examples/measurements_compaction.py
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,42 @@ | ||
#!/bin/bash
# Launches the band_composer.py preprocessing step in the background and, once
# per second for as long as that job is alive, appends:
#   cpu_log        - the 'Cpu' lines of a top snapshot
#   mem_log        - the 'MiB Mem' lines of the same snapshot
#   nvidiasmi_log  - nvidia-smi CSV rows matching GPU_BUS_ID
# When the job ends, examples/measurements_compaction.py is executed
# (presumably to post-process the logs - confirm).
#
# run like this (substitute this script's own path):
#   sudo -E env "PATH=$PATH" bash examples/<this_script>.sh
#
# Environment:
#   GPU_BUS_ID  PCI bus id used to select rows of nvidia-smi output
#               (default: 00000000:25:00.0)

GPU_BUS_ID=${GPU_BUS_ID:-00000000:25:00.0}

# iotop is not invoked below; it is kept as a dependency but only installed
# when it is actually missing, instead of calling apt-get on every run.
if ! command -v iotop > /dev/null; then
  sudo apt-get install -y iotop > /dev/null
fi

# The python script and examples/ are addressed relative to the parent of
# examples/, so step up when the script was started from inside examples/.
if [ "${PWD##*/}" = "examples" ]; then
  cd .. || exit 1
fi

# Start every run with fresh output files.
echo "" > nohup.out
echo "" > nvidiasmi_log
echo "" > mem_log
echo "" > cpu_log

export NO_CLI=True

# Each continuation line is preceded by a space so that the arguments cannot
# be glued onto the previous word by the backslash-newline.
nohup time sudo -E env "PATH=$PATH" python innofw/utils/data_utils/preprocessing/band_composer.py \
  --src_type sentinel2 \
  --src_path tests/data/images/other/satellite_cropped/sentinel2/one \
  --channels '["RED", "GRN", "BLU", "NIR"]' &
PID=$!
echo "Saving cpu+ram info and nvidia-smi to cpu_log + mem_log and nvidiasmi_log"
echo "$PID"

# Poll the background job itself rather than counting `lsof nohup.out` rows:
# the lsof count can still be zero right after launch (ending the loop before
# it starts) and nohup only writes nohup.out when stdout is a terminal.
while kill -0 "$PID" 2> /dev/null; do
  # One top snapshot feeds both logs so CPU and memory share a sample time.
  top_snapshot=$(top -b -n 1)
  grep -E 'Cpu' <<< "$top_snapshot" >> cpu_log
  grep -E 'MiB Mem' <<< "$top_snapshot" >> mem_log
  # -F: the bus id is a literal string, not a regular expression.
  sudo nvidia-smi --query-gpu=timestamp,name,pci.bus_id,driver_version,pstate,pcie.link.gen.max,pcie.link.gen.current,temperature.gpu,utilization.gpu,utilization.memory,memory.total,memory.free,memory.used --format=csv \
    | grep -F -- "$GPU_BUS_ID" >> nvidiasmi_log
  sleep 1
done

# The job has already exited here, so collect its status instead of sending
# SIGKILL to a PID that may have been reused by an unrelated process.
if ! wait "$PID"; then
  echo "warning: monitored command exited with a non-zero status" >&2
fi

sudo -E env "PATH=$PATH" python examples/measurements_compaction.py
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,32 @@ | ||
#!/bin/bash
# Launches the YOLOv5 detection training run in the background and, once per
# second for as long as that job is alive, appends:
#   cpu_log        - the 'Cpu' lines of a top snapshot
#   mem_log        - the 'MiB Mem' lines of the same snapshot
#   nvidiasmi_log  - the full nvidia-smi CSV output (header row included,
#                    all GPUs; this script does not filter by bus id)
#
# run like this (substitute this script's own path):
#   sudo -E env "PATH=$PATH" bash examples/<this_script>.sh

# iotop is not invoked below; it is kept as a dependency but only installed
# when it is actually missing, instead of calling apt-get on every run.
if ! command -v iotop > /dev/null; then
  sudo apt-get install -y iotop > /dev/null
fi

# train.py is addressed relative to the parent of examples/, so step up when
# the script was started from inside examples/.
if [ "${PWD##*/}" = "examples" ]; then
  cd .. || exit 1
fi

# Start every run with fresh output files.
echo "" > nohup.out
echo "" > nvidiasmi_log
echo "" > mem_log
echo "" > cpu_log

export NO_CLI=True

nohup time sudo -E env "PATH=$PATH" python train.py \
  experiments=detection/KA_120722_8adfcdaa_yolov5.yaml \
  epochs=100 optimizers=adam accelerator=gpu &
PID=$!
echo "Saving cpu+ram info and nvidia-smi to cpu_log+mem_log and nvidiasmi_log"
echo "$PID"

# Sample only while the background job exists. The previous `while true` never
# ended, so logging continued after training finished and the cleanup after
# the loop could never run.
while kill -0 "$PID" 2> /dev/null; do
  # One top snapshot feeds both logs so CPU and memory share a sample time.
  top_snapshot=$(top -b -n 1)
  grep -E 'Cpu' <<< "$top_snapshot" >> cpu_log
  grep -E 'MiB Mem' <<< "$top_snapshot" >> mem_log
  sudo nvidia-smi --query-gpu=timestamp,name,pci.bus_id,driver_version,pstate,pcie.link.gen.max,pcie.link.gen.current,temperature.gpu,utilization.gpu,utilization.memory,memory.total,memory.free,memory.used --format=csv >> nvidiasmi_log
  sleep 1
done

# The job has already exited when the loop ends, so there is nothing left to
# kill; reap it and surface a failed run instead.
if ! wait "$PID"; then
  echo "warning: monitored command exited with a non-zero status" >&2
fi
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,39 @@ | ||
#!/bin/bash
# Launches the MNIST classification training run in the background and, once
# per second for as long as that job is alive, appends:
#   cpu_log        - the 'Cpu' lines of a top snapshot
#   mem_log        - the 'MiB Mem' lines of the same snapshot
#   nvidiasmi_log  - nvidia-smi CSV rows matching GPU_BUS_ID
# When the job ends, examples/measurements_compaction.py is executed
# (presumably to post-process the logs - confirm).
#
# run like this: sudo -E env "PATH=$PATH" bash examples/measure_image_classification.sh
#
# Environment:
#   GPU_BUS_ID  PCI bus id used to select rows of nvidia-smi output
#               (default: 00000000:25:00.0)

GPU_BUS_ID=${GPU_BUS_ID:-00000000:25:00.0}

# iotop is not invoked below; it is kept as a dependency but only installed
# when it is actually missing, instead of calling apt-get on every run.
if ! command -v iotop > /dev/null; then
  sudo apt-get install -y iotop > /dev/null
fi

# train.py and examples/ are addressed relative to the parent of examples/,
# so step up when the script was started from inside examples/.
if [ "${PWD##*/}" = "examples" ]; then
  cd .. || exit 1
fi

# Start every run with fresh output files.
echo "" > nohup.out
echo "" > nvidiasmi_log
echo "" > mem_log
echo "" > cpu_log

export NO_CLI=True

nohup time sudo -E env "PATH=$PATH" python train.py \
  experiments=classification/KG_090323_wpng92_mnist.yaml epochs=100 &
PID=$!
echo "Saving cpu+ram info and nvidia-smi to cpu_log + mem_log and nvidiasmi_log"
echo "$PID"

# Poll the background job itself rather than counting `lsof nohup.out` rows:
# the lsof count can still be zero right after launch (ending the loop before
# it starts) and nohup only writes nohup.out when stdout is a terminal.
while kill -0 "$PID" 2> /dev/null; do
  # One top snapshot feeds both logs so CPU and memory share a sample time.
  top_snapshot=$(top -b -n 1)
  grep -E 'Cpu' <<< "$top_snapshot" >> cpu_log
  grep -E 'MiB Mem' <<< "$top_snapshot" >> mem_log
  # -F: the bus id is a literal string, not a regular expression.
  sudo nvidia-smi --query-gpu=timestamp,name,pci.bus_id,driver_version,pstate,pcie.link.gen.max,pcie.link.gen.current,temperature.gpu,utilization.gpu,utilization.memory,memory.total,memory.free,memory.used --format=csv \
    | grep -F -- "$GPU_BUS_ID" >> nvidiasmi_log
  sleep 1
done

# The job has already exited here, so collect its status instead of sending
# SIGKILL to a PID that may have been reused by an unrelated process.
if ! wait "$PID"; then
  echo "warning: monitored command exited with a non-zero status" >&2
fi

sudo -E env "PATH=$PATH" python examples/measurements_compaction.py
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,39 @@ | ||
#!/bin/bash
# Launches the linear-regression training run in the background and, once per
# second for as long as that job is alive, appends:
#   cpu_log        - the 'Cpu' lines of a top snapshot
#   mem_log        - the 'MiB Mem' lines of the same snapshot
#   nvidiasmi_log  - nvidia-smi CSV rows matching GPU_BUS_ID
# When the job ends, examples/measurements_compaction.py is executed
# (presumably to post-process the logs - confirm).
#
# run like this (substitute this script's own path):
#   sudo -E env "PATH=$PATH" bash examples/<this_script>.sh
#
# Environment:
#   GPU_BUS_ID  PCI bus id used to select rows of nvidia-smi output
#               (default: 00000000:25:00.0)

GPU_BUS_ID=${GPU_BUS_ID:-00000000:25:00.0}

# iotop is not invoked below; it is kept as a dependency but only installed
# when it is actually missing, instead of calling apt-get on every run.
if ! command -v iotop > /dev/null; then
  sudo apt-get install -y iotop > /dev/null
fi

# train.py and examples/ are addressed relative to the parent of examples/,
# so step up when the script was started from inside examples/.
if [ "${PWD##*/}" = "examples" ]; then
  cd .. || exit 1
fi

# Start every run with fresh output files.
echo "" > nohup.out
echo "" > nvidiasmi_log
echo "" > mem_log
echo "" > cpu_log

export NO_CLI=True

nohup time sudo -E env "PATH=$PATH" python train.py \
  experiments=regression/KA_130722_9f7134db_linear_regression.yaml &
PID=$!
echo "Saving cpu+ram info and nvidia-smi to cpu_log + mem_log and nvidiasmi_log"
echo "$PID"

# Poll the background job itself rather than counting `lsof nohup.out` rows:
# the lsof count can still be zero right after launch (ending the loop before
# it starts) and nohup only writes nohup.out when stdout is a terminal.
while kill -0 "$PID" 2> /dev/null; do
  # One top snapshot feeds both logs so CPU and memory share a sample time.
  top_snapshot=$(top -b -n 1)
  grep -E 'Cpu' <<< "$top_snapshot" >> cpu_log
  grep -E 'MiB Mem' <<< "$top_snapshot" >> mem_log
  # -F: the bus id is a literal string, not a regular expression.
  sudo nvidia-smi --query-gpu=timestamp,name,pci.bus_id,driver_version,pstate,pcie.link.gen.max,pcie.link.gen.current,temperature.gpu,utilization.gpu,utilization.memory,memory.total,memory.free,memory.used --format=csv \
    | grep -F -- "$GPU_BUS_ID" >> nvidiasmi_log
  sleep 1
done

# The job has already exited here, so collect its status instead of sending
# SIGKILL to a PID that may have been reused by an unrelated process.
if ! wait "$PID"; then
  echo "warning: monitored command exited with a non-zero status" >&2
fi

sudo -E env "PATH=$PATH" python examples/measurements_compaction.py
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,39 @@ | ||
#!/bin/bash
# Launches the one-shot-learning training run in the background and, once per
# second for as long as that job is alive, appends:
#   cpu_log        - the 'Cpu' lines of a top snapshot
#   mem_log        - the 'MiB Mem' lines of the same snapshot
#   nvidiasmi_log  - nvidia-smi CSV rows matching GPU_BUS_ID
# When the job ends, examples/measurements_compaction.py is executed
# (presumably to post-process the logs - confirm).
#
# run like this (substitute this script's own path):
#   sudo -E env "PATH=$PATH" bash examples/<this_script>.sh
#
# Environment:
#   GPU_BUS_ID  PCI bus id used to select rows of nvidia-smi output
#               (default: 00000000:25:00.0)

GPU_BUS_ID=${GPU_BUS_ID:-00000000:25:00.0}

# iotop is not invoked below; it is kept as a dependency but only installed
# when it is actually missing, instead of calling apt-get on every run.
if ! command -v iotop > /dev/null; then
  sudo apt-get install -y iotop > /dev/null
fi

# train.py and examples/ are addressed relative to the parent of examples/,
# so step up when the script was started from inside examples/.
if [ "${PWD##*/}" = "examples" ]; then
  cd .. || exit 1
fi

# Start every run with fresh output files.
echo "" > nohup.out
echo "" > nvidiasmi_log
echo "" > mem_log
echo "" > cpu_log

export NO_CLI=True

nohup time sudo -E env "PATH=$PATH" python train.py \
  experiments=one-shot-learning/IM_190722_vwer3f23_oneshotlearning.yaml &
PID=$!
echo "Saving cpu+ram info and nvidia-smi to cpu_log + mem_log and nvidiasmi_log"
echo "$PID"

# Poll the background job itself rather than counting `lsof nohup.out` rows:
# the lsof count can still be zero right after launch (ending the loop before
# it starts) and nohup only writes nohup.out when stdout is a terminal.
while kill -0 "$PID" 2> /dev/null; do
  # One top snapshot feeds both logs so CPU and memory share a sample time.
  top_snapshot=$(top -b -n 1)
  grep -E 'Cpu' <<< "$top_snapshot" >> cpu_log
  grep -E 'MiB Mem' <<< "$top_snapshot" >> mem_log
  # -F: the bus id is a literal string, not a regular expression.
  sudo nvidia-smi --query-gpu=timestamp,name,pci.bus_id,driver_version,pstate,pcie.link.gen.max,pcie.link.gen.current,temperature.gpu,utilization.gpu,utilization.memory,memory.total,memory.free,memory.used --format=csv \
    | grep -F -- "$GPU_BUS_ID" >> nvidiasmi_log
  sleep 1
done

# The job has already exited here, so collect its status instead of sending
# SIGKILL to a PID that may have been reused by an unrelated process.
if ! wait "$PID"; then
  echo "warning: monitored command exited with a non-zero status" >&2
fi

sudo -E env "PATH=$PATH" python examples/measurements_compaction.py
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,39 @@ | ||
#!/bin/bash
# Launches the semantic-segmentation (unet) training run in the background
# and, once per second for as long as that job is alive, appends:
#   cpu_log        - the 'Cpu' lines of a top snapshot
#   mem_log        - the 'MiB Mem' lines of the same snapshot
#   nvidiasmi_log  - nvidia-smi CSV rows matching GPU_BUS_ID
# When the job ends, examples/measurements_compaction.py is executed
# (presumably to post-process the logs - confirm).
#
# run like this (substitute this script's own path):
#   sudo -E env "PATH=$PATH" bash examples/<this_script>.sh
#
# Environment:
#   GPU_BUS_ID  PCI bus id used to select rows of nvidia-smi output
#               (default: 00000000:25:00.0)

GPU_BUS_ID=${GPU_BUS_ID:-00000000:25:00.0}

# iotop is not invoked below; it is kept as a dependency but only installed
# when it is actually missing, instead of calling apt-get on every run.
if ! command -v iotop > /dev/null; then
  sudo apt-get install -y iotop > /dev/null
fi

# train.py and examples/ are addressed relative to the parent of examples/,
# so step up when the script was started from inside examples/.
if [ "${PWD##*/}" = "examples" ]; then
  cd .. || exit 1
fi

# Start every run with fresh output files.
echo "" > nohup.out
echo "" > nvidiasmi_log
echo "" > mem_log
echo "" > cpu_log

export NO_CLI=True

nohup time sudo -E env "PATH=$PATH" python train.py \
  experiments=semantic-segmentation/KG_041223_ingieq921_unet.yaml \
  epochs=100 optimizers=adam accelerator=gpu &
PID=$!
echo "Saving cpu+ram info and nvidia-smi to cpu_log + mem_log and nvidiasmi_log"
echo "$PID"

# Poll the background job itself rather than counting `lsof nohup.out` rows:
# the lsof count can still be zero right after launch (ending the loop before
# it starts) and nohup only writes nohup.out when stdout is a terminal.
while kill -0 "$PID" 2> /dev/null; do
  # One top snapshot feeds both logs so CPU and memory share a sample time.
  top_snapshot=$(top -b -n 1)
  grep -E 'Cpu' <<< "$top_snapshot" >> cpu_log
  grep -E 'MiB Mem' <<< "$top_snapshot" >> mem_log
  # -F: the bus id is a literal string, not a regular expression.
  sudo nvidia-smi --query-gpu=timestamp,name,pci.bus_id,driver_version,pstate,pcie.link.gen.max,pcie.link.gen.current,temperature.gpu,utilization.gpu,utilization.memory,memory.total,memory.free,memory.used --format=csv \
    | grep -F -- "$GPU_BUS_ID" >> nvidiasmi_log
  sleep 1
done

# The job has already exited here, so collect its status instead of sending
# SIGKILL to a PID that may have been reused by an unrelated process.
if ! wait "$PID"; then
  echo "warning: monitored command exited with a non-zero status" >&2
fi

sudo -E env "PATH=$PATH" python examples/measurements_compaction.py
Oops, something went wrong.