From 63da1bf95e16a6681b2bcd01116e36625c508add Mon Sep 17 00:00:00 2001 From: Jane Herriman <> Date: Mon, 3 Jun 2024 19:58:03 -0700 Subject: [PATCH] update job submission details --- episodes/01-introduction.md | 14 +++--- episodes/02-maestro_on_the_cluster.md | 68 ++++++++++++++------------- episodes/03-maestro-and-mpi.md | 51 +++++++++++--------- episodes/04-placeholders.md | 14 +++--- episodes/05-chaining_rules.md | 28 ++++++----- episodes/06-multiple-parameters.md | 14 +++--- 6 files changed, 104 insertions(+), 85 deletions(-) diff --git a/episodes/01-introduction.md b/episodes/01-introduction.md index 2b7eb47..c18905a 100644 --- a/episodes/01-introduction.md +++ b/episodes/01-introduction.md @@ -229,15 +229,15 @@ Where would `Hello` be written for the following YAML? ```yml description: - name: MyHello - description: Report a node's hostname. + name: MyHello + description: Report a node's hostname. study: - - name: give-salutation - description: Write the login node's hostname to a file - run: - cmd: | - echo "hello" > greeting.txt + - name: give-salutation + description: Write the login node's hostname to a file + run: + cmd: | + echo "hello" > greeting.txt ``` 1. `~/give-salutation_{date}_{time}/greeting/greeting.txt` diff --git a/episodes/02-maestro_on_the_cluster.md b/episodes/02-maestro_on_the_cluster.md index d006ed4..d8c178b 100644 --- a/episodes/02-maestro_on_the_cluster.md +++ b/episodes/02-maestro_on_the_cluster.md @@ -33,10 +33,11 @@ should run. ```yml batch: - type: slurm - host: quartz # enter the machine you'll run on - bank: guests # enter the bank to charge - queue: pdebug # enter the partition in which your job should run + type: slurm + host: ruby # enter the machine you'll run on + bank: guests # enter the bank to charge + queue: pbatch # partition in which your job should run + reservation: HPCC1B # reservation for this workshop ``` Second, we need to specify the number of nodes, number of processes, @@ -47,11 +48,11 @@ a time limit of 30 seconds: ```yml (...) run: - cmd: | - hostname >> hostname.txt - nodes: 1 - procs: 1 - walltime: "00:00:30" + cmd: | + hostname >> hostname.txt + nodes: 1 + procs: 1 + walltime: "00:00:30" ``` Whereas `run` previously held only info about the command we wanted to @@ -63,26 +64,27 @@ With these changes, our updated YAML file might look like ```yml description: - name: Hostnames - description: Report a node's hostname. + name: Hostnames + description: Report a node's hostname. batch: - type: slurm - host: quartz # machine to run on - bank: guests # bank - queue: pdebug # partition + type: slurm + host: ruby # machine + bank: guests # bank + queue: pbatch # partition + reservation: HPCC1B # reservation for this workshop study: - - name: hostname-login - description: Write the login node's hostname to a file - run: - cmd: | - hostname > hostname_login.txt - - name: hostname_batch - description: Write the node's hostname to a file - run: - cmd: | - hostname >> hostname.txt + - name: hostname-login + description: Write the login node's hostname to a file + run: + cmd: | + hostname > hostname_login.txt + - name: hostname_batch + description: Write the node's hostname to a file + run: + cmd: | + hostname >> hostname.txt nodes: 1 procs: 1 walltime: "00:00:30" @@ -99,8 +101,8 @@ slurm. ## Running on the cluster Modify your YAML file, `hostname.yaml` to execute `hostname` on the -_cluster_. Run with 1 node and 1 process using the bank `guest` on -the partition `psummer` on `quartz`. +_cluster_. Run with 1 node and 1 process using the bank `guests` on +the partition `pbatch` on `ruby`. If you run this multiple times, do you always run on the same node? (Is the hostname printed always the same?) @@ -116,9 +118,10 @@ description: batch: type: slurm - host: quartz # machine to run on - bank: guest # bank - queue: psummer # partition + host: ruby # machine + bank: guests # bank + queue: pbatch # partition + reservation: HPCC1B # reservation for this workshop study: - name: hostname-login @@ -149,8 +152,9 @@ subdirectory `hostname_batch`, you'll find a file called command ran. If you run the job multiple times, you will probably land on different nodes; this means you'll see different node numbers in different `hostname.txt` files. If you see the same number more than -once, don't worry! If you get any answer other than `pascal83`, you're -doing it correctly. :) +once, don't worry! (If you want to double check that the hostnames +printed are not for login nodes, you can run `nodeattr -c login` to +check the IDs of all login nodes on the system.) :::::: diff --git a/episodes/03-maestro-and-mpi.md b/episodes/03-maestro-and-mpi.md index 63d062e..b7a293f 100644 --- a/episodes/03-maestro-and-mpi.md +++ b/episodes/03-maestro-and-mpi.md @@ -143,9 +143,10 @@ description: batch: type: slurm - host: quartz # machine to run on - bank: guests # bank - queue: pdebug # partition + host: ruby # machine + bank: guests # bank + queue: pbatch # partition + reservation: HPCC1B # reservation for this workshop study: - name: amdahl @@ -184,9 +185,10 @@ description: batch: type: slurm - host: quartz # machine to run on - bank: guests # bank - queue: pdebug # partition + host: ruby # machine + bank: guests # bank + queue: pbatch # partition + reservation: HPCC1B # reservation for this workshop study: - name: amdahl @@ -224,7 +226,7 @@ parallel proportion of the workload. Hello, World! I am process 0 of 1 on pascal17. I will do all the serial 'work' for 5.324555 seconds. - + Hello, World! I am process 0 of 1 on pascal17. I will do parallel 'work' for 22.349517 seconds. @@ -298,9 +300,10 @@ description: batch: type: slurm - host: quartz # machine to run on - bank: guests # bank - queue: pdebug # partition + host: ruby # machine + bank: guests # bank + queue: pbatch # partition + reservation: HPCC1B # reservation for this workshop study: - name: amdahl @@ -372,9 +375,10 @@ description: batch: type: slurm - host: quartz # machine to run on - bank: guests # bank - queue: pdebug # partition + host: ruby # machine + bank: guests # bank + queue: pbatch # partition + reservation: HPCC1B # reservation for this workshop study: - name: amdahl @@ -401,9 +405,10 @@ description: batch: type: slurm - host: quartz # machine to run on - bank: guests # bank - queue: pdebug # partition + host: ruby # machine + bank: guests # bank + queue: pbatch # partition + reservation: HPCC1B # reservation for this workshop study: - name: amdahl @@ -432,9 +437,10 @@ description: batch: type: slurm - host: quartz # machine to run on - bank: guests # bank - queue: pdebug # partition + host: ruby # machine + bank: guests # bank + queue: pbatch # partition + reservation: HPCC1B # reservation for this workshop study: - name: amdahl @@ -484,9 +490,10 @@ description: batch: type: slurm - host: quartz # machine to run on - bank: guests # bank - queue: pdebug # partition + host: ruby # machine + bank: guests # bank + queue: pbatch # partition + reservation: HPCC1B # reservation for this workshop env: variables: diff --git a/episodes/04-placeholders.md b/episodes/04-placeholders.md index 94b60fe..415704b 100644 --- a/episodes/04-placeholders.md +++ b/episodes/04-placeholders.md @@ -190,9 +190,10 @@ description: batch: type: slurm - host: quartz # machine to run on - bank: guests # bank - queue: pdebug # partition + host: ruby # machine + bank: guests # bank + queue: pbatch # partition + reservation: HPCC1B # reservation for this workshop env: variables: @@ -274,9 +275,10 @@ description: batch: type: slurm - host: quartz # machine to run on - bank: guests # bank - queue: pdebug # partition + host: ruby # machine + bank: guests # bank + queue: pbatch # partition + reservation: HPCC1B # reservation for this workshop env: variables: diff --git a/episodes/05-chaining_rules.md b/episodes/05-chaining_rules.md index 3285959..f815b55 100644 --- a/episodes/05-chaining_rules.md +++ b/episodes/05-chaining_rules.md @@ -52,9 +52,10 @@ description: batch: type: slurm - host: quartz # machine to run on - bank: guests # bank - queue: pdebug # partition + host: ruby # machine + bank: guests # bank + queue: pbatch # partition + reservation: HPCC1B # reservation for this workshop env: variables: @@ -216,9 +217,10 @@ description: batch: type: slurm - host: quartz # machine to run on - bank: guests # bank - queue: pdebug # partition + host: ruby # machine + bank: guests # bank + queue: pbatch # partition + reservation: HPCC1B # reservation for this workshop env: variables: @@ -341,9 +343,10 @@ description: batch: type: slurm - host: pascal # machine to run on - bank: lc #bank - queue: pvis # partition + host: ruby # machine + bank: guests # bank + queue: pbatch # partition + reservation: HPCC1B # reservation for this workshop env: variables: @@ -568,9 +571,10 @@ description: batch: type: slurm - host: quartz # machine to run on - bank: guests # bank - queue: pdebug # partition + host: ruby # machine + bank: guests # bank + queue: pbatch # partition + reservation: HPCC1B # reservation for this workshop env: variables: diff --git a/episodes/06-multiple-parameters.md b/episodes/06-multiple-parameters.md index d038916..a8758c2 100644 --- a/episodes/06-multiple-parameters.md +++ b/episodes/06-multiple-parameters.md @@ -93,9 +93,10 @@ description: batch: type: slurm - host: quartz # machine to run on - bank: guests # bank - queue: pdebug # partition + host: ruby # machine + bank: guests # bank + queue: pbatch # partition + reservation: HPCC1B # reservation for this workshop env: variables: @@ -249,9 +250,10 @@ description: batch: type: slurm - host: quartz # machine to run on - bank: guests # bank - queue: pdebug # partition + host: ruby # machine + bank: guests # bank + queue: pbatch # partition + reservation: HPCC1B # reservation for this workshop env: variables: