changeset 172:72b0420167dc

generalised sbatch front-end to cdx2tsv.py
author Henry S. Thompson <ht@inf.ed.ac.uk>
date Thu, 28 Jul 2022 17:24:29 +0100
parents c7d57d158331
children bc791ff523e7
files bin/c2t.sh
diffstat 1 files changed, 18 insertions(+), 0 deletions(-) [+]
line wrap: on
line diff
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/bin/c2t.sh	Thu Jul 28 17:24:29 2022 +0100
@@ -0,0 +1,18 @@
+#!/bin/bash
+# sbatch front-end: runs $W/hst/bin/_c2t.sh via $W/shared/bin/sing under srun, passing all arguments on.
+# Invoke this as e.g. sbatch -N 4 --ntasks=10 -c 15 c2t.sh \
+#                     CC-MAIN-2019-35 cdx_counts 0 299 1 \
+#                     '(filename,f.split(/,maxsplit=5)[4][0])' ...
+
+#SBATCH --time=01:00:00
+#SBATCH --partition=standard
+#SBATCH --qos=standard
+#SBATCH --account=ec184-guest
+#SBATCH --job-name c2t
+
+export W=/work/dc007/dc007
+# SLURM_CPUS_PER_TASK is unset unless sbatch was given -c; fall back to 1 so srun -c always gets a value.
+cpus=${SLURM_CPUS_PER_TASK:-1}
+echo $(date) Launching $SLURM_JOB_NUM_NODES nodes for c2t "$@" from $(hostname) to do $SLURM_NTASKS tasks, $cpus cpus each
+srun -c "$cpus" "$W/shared/bin/sing" "$W/hst/bin/_c2t.sh" "$@"
+