From 74557748480153ee1e4194b3463a983b97ffd736 Mon Sep 17 00:00:00 2001
From: jfgrimm <jasper.grimm@york.ac.uk>
Date: Mon, 22 Jan 2024 12:17:34 +0000
Subject: [PATCH 1/8] adding easyconfigs:
 ESM-2-2.0.0-foss-2023a-CUDA-12.1.1.eb,
 topaz-0.2.5.20231120-foss-2023a-CUDA-12.1.1.eb,
 torchvision-0.16.2-foss-2023a-CUDA-12.1.1.eb

---
 .../ESM-2-2.0.0-foss-2023a-CUDA-12.1.1.eb     | 42 ++++++++++++++
 ...z-0.2.5.20231120-foss-2023a-CUDA-12.1.1.eb | 55 +++++++++++++++++++
 ...rchvision-0.16.2-foss-2023a-CUDA-12.1.1.eb | 27 +++++++++
 3 files changed, 124 insertions(+)
 create mode 100644 easybuild/easyconfigs/e/ESM-2/ESM-2-2.0.0-foss-2023a-CUDA-12.1.1.eb
 create mode 100644 easybuild/easyconfigs/t/topaz/topaz-0.2.5.20231120-foss-2023a-CUDA-12.1.1.eb
 create mode 100644 easybuild/easyconfigs/t/torchvision/torchvision-0.16.2-foss-2023a-CUDA-12.1.1.eb

diff --git a/easybuild/easyconfigs/e/ESM-2/ESM-2-2.0.0-foss-2023a-CUDA-12.1.1.eb b/easybuild/easyconfigs/e/ESM-2/ESM-2-2.0.0-foss-2023a-CUDA-12.1.1.eb
new file mode 100644
index 000000000000..eae9330bcdb3
--- /dev/null
+++ b/easybuild/easyconfigs/e/ESM-2/ESM-2-2.0.0-foss-2023a-CUDA-12.1.1.eb
@@ -0,0 +1,42 @@
+easyblock = 'PythonBundle'
+
+name = 'ESM-2'
+version = '2.0.0'
+versionsuffix = '-CUDA-%(cudaver)s'
+
+homepage = 'https://github.com/facebookresearch/esm'
+description = """ESM-2 outperforms all tested single-sequence protein language models
+ across a range of structure prediction tasks. ESMFold harnesses the ESM-2 language model to generate
+ accurate structure predictions end to end directly from the sequence of a protein."""
+
+toolchain = {'name': 'foss', 'version': '2023a'}
+
+builddependencies = [
+    ('Java', '11', '', SYSTEM),  # needed by ANTLR4 runtime
+]
+
+dependencies = [
+    ('CUDA', '12.1.1', '', SYSTEM),
+    ('Python', '3.11.3'),
+    ('PyTorch', '2.1.2', versionsuffix),
+]
+
+use_pip = True
+sanity_pip_check = True
+
+# omegaconf is required for esmfold (in addition to OpenFold-1.0.1)
+exts_list = [
+    ('antlr4-python3-runtime', '4.9.3', {
+        'modulename': 'antlr4',
+        'checksums': ['f224469b4168294902bb1efa80a8bf7855f24c99aef99cbefc1bcd3cce77881b'],
+    }),
+    ('omegaconf', '2.3.0', {
+        'checksums': ['d5d4b6d29955cc50ad50c46dc269bcd92c6e00f5f90d23ab5fee7bfca4ba4cc7'],
+    }),
+    ('fair-esm', version, {
+        'modulename': "esm, esm.pretrained",
+        'checksums': ['4ed34d4598ec75ed6550a4e581d023bf8d4a8375317ecba6269bb68135f80c85'],
+    }),
+]
+
+moduleclass = 'bio'
diff --git a/easybuild/easyconfigs/t/topaz/topaz-0.2.5.20231120-foss-2023a-CUDA-12.1.1.eb b/easybuild/easyconfigs/t/topaz/topaz-0.2.5.20231120-foss-2023a-CUDA-12.1.1.eb
new file mode 100644
index 000000000000..a99c772078df
--- /dev/null
+++ b/easybuild/easyconfigs/t/topaz/topaz-0.2.5.20231120-foss-2023a-CUDA-12.1.1.eb
@@ -0,0 +1,55 @@
+# Thomas Hoffman, EMBL Heidelberg, structures-it@embl.de, 2023/11 
+easyblock = 'PythonPackage'
+
+name = 'topaz'
+_mainversion = '0.2.5'
+_commitdate = '20231120'
+_commit = '25cb2cb'
+version = '%s.%s' % (_mainversion, _commitdate)
+versionsuffix = '-CUDA-%(cudaver)s'
+
+homepage = 'http://cb.csail.mit.edu/cb/topaz/'
+
+description = """Particle picking software for single particle cryo-electron microscopy using    
+convolutional neural networks and positive-unlabeled learning. Includes methods
+for micrograph denoising."""
+
+toolchain = {'name': 'foss', 'version': '2023a'}
+
+dependencies = [
+    ('CUDA', '12.1.1', '', SYSTEM),
+    ('Python', '3.11.3'),
+    ('SciPy-bundle', '2023.07'),
+    ('PyTorch', '2.1.2', versionsuffix),
+    ('scikit-learn', '1.3.1'),
+    ('torchvision', '0.16.2', versionsuffix),
+]
+
+source_urls = ['https://github.com/tbepler/topaz/archive']
+sources = [{
+    'download_filename': '%s.tar.gz' % _commit,
+    'filename': '%(name)s-%(version)s.tar.gz'
+}]
+patches = [
+    'topaz-0.2.5_install_relion3_wrappers.patch',
+]
+checksums = [
+    {'topaz-0.2.5.20231120.tar.gz': 'ca0630f9a69622eb3e10c9de310f58ac846e60a5504c4533398a9a75b3091df9'},
+    {'topaz-0.2.5_install_relion3_wrappers.patch': '0fe23a0ecaf887aaa89641a7e7cf37fafd3134384b0a8f46acb4e17537d1a151'},
+]
+
+download_dep_fail = True
+use_pip = True
+sanity_pip_check = True
+
+options = {'modulename': 'topaz'}
+
+_relion3_wrappers = ['denoise', 'pick', 'train', 'train_denoise']
+
+sanity_check_paths = {
+    'files': ["bin/run_topaz_%s.py" % x for x in _relion3_wrappers],
+    'dirs': [],
+}
+sanity_check_commands = ['run_topaz_%s.py --help' % x for x in _relion3_wrappers] + ['topaz --help']
+
+moduleclass = 'chem'
diff --git a/easybuild/easyconfigs/t/torchvision/torchvision-0.16.2-foss-2023a-CUDA-12.1.1.eb b/easybuild/easyconfigs/t/torchvision/torchvision-0.16.2-foss-2023a-CUDA-12.1.1.eb
new file mode 100644
index 000000000000..a72f7b8760aa
--- /dev/null
+++ b/easybuild/easyconfigs/t/torchvision/torchvision-0.16.2-foss-2023a-CUDA-12.1.1.eb
@@ -0,0 +1,27 @@
+name = 'torchvision'
+version = '0.16.2'
+versionsuffix = '-CUDA-%(cudaver)s'
+
+homepage = 'https://github.com/pytorch/vision'
+description = " Datasets, Transforms and Models specific to Computer Vision"
+
+toolchain = {'name': 'foss', 'version': '2023a'}
+
+source_urls = ['https://github.com/pytorch/vision/archive']
+sources = ['v%(version)s.tar.gz']
+patches = ['%(name)s-0.16.2_ffmpeg-6.0-fix.patch']
+checksums = [
+    {'v0.16.2.tar.gz': '8c1f2951e98d8ada6e5a468f179af4be9f56d2ebc3ab057af873da61669806d7'},
+    {'torchvision-0.16.2_ffmpeg-6.0-fix.patch': 'a49336e7bfa1c950e886852bff37a3ea2146ac7bda87241e3ffb31c5cb869cce'},
+]
+
+builddependencies = [('CMake', '3.26.3')]
+
+dependencies = [
+    ('CUDA', '12.1.1', '', SYSTEM),
+    ('Python', '3.11.3'),
+    ('Pillow-SIMD', '9.5.0'),
+    ('PyTorch', '2.1.2', '-CUDA-%(cudaver)s'),
+]
+
+moduleclass = 'vis'

From c7410dcdb1410136b7e3a816bff669c3b9478c89 Mon Sep 17 00:00:00 2001
From: jfgrimm <jasper.grimm@york.ac.uk>
Date: Wed, 24 Jan 2024 12:00:36 +0000
Subject: [PATCH 2/8] add torchvision patch

---
 .../torchvision-0.16.2_ffmpeg-6.0-fix.patch   | 36 +++++++++++++++++++
 1 file changed, 36 insertions(+)
 create mode 100644 easybuild/easyconfigs/t/torchvision/torchvision-0.16.2_ffmpeg-6.0-fix.patch

diff --git a/easybuild/easyconfigs/t/torchvision/torchvision-0.16.2_ffmpeg-6.0-fix.patch b/easybuild/easyconfigs/t/torchvision/torchvision-0.16.2_ffmpeg-6.0-fix.patch
new file mode 100644
index 000000000000..7a3637f3adc9
--- /dev/null
+++ b/easybuild/easyconfigs/t/torchvision/torchvision-0.16.2_ffmpeg-6.0-fix.patch
@@ -0,0 +1,36 @@
+From 86620bd84b872b76db0acafec167949dca03a29e Mon Sep 17 00:00:00 2001
+From: =?UTF-8?q?Zolt=C3=A1n=20B=C3=B6sz=C3=B6rm=C3=A9nyi?=
+ <zboszor@gmail.com>
+Date: Tue, 7 Nov 2023 10:43:11 +0100
+Subject: [PATCH] Fix build with ffmpeg 6.0
+MIME-Version: 1.0
+Content-Type: text/plain; charset=UTF-8
+Content-Transfer-Encoding: 8bit
+
+Signed-off-by: Zoltán Böszörményi <zboszor@gmail.com>
+---
+ torchvision/csrc/io/decoder/stream.cpp | 11 ++---------
+ 1 file changed, 2 insertions(+), 9 deletions(-)
+
+diff --git a/torchvision/csrc/io/decoder/stream.cpp b/torchvision/csrc/io/decoder/stream.cpp
+index 0d625ef211c..8c914050587 100644
+--- a/torchvision/csrc/io/decoder/stream.cpp
++++ b/torchvision/csrc/io/decoder/stream.cpp
+@@ -63,15 +63,8 @@ int Stream::openCodec(std::vector<DecoderMetadata>* metadata, int num_threads) {
+     codecCtx_->thread_count = num_threads;
+   } else {
+     // otherwise set sensible defaults
+-    // with the special case for the different MPEG4 codecs
+-    // that don't have threading context functions
+-    if (codecCtx_->codec->capabilities & AV_CODEC_CAP_INTRA_ONLY) {
+-      codecCtx_->thread_type = FF_THREAD_FRAME;
+-      codecCtx_->thread_count = 2;
+-    } else {
+-      codecCtx_->thread_count = 8;
+-      codecCtx_->thread_type = FF_THREAD_SLICE;
+-    }
++    codecCtx_->thread_count = 8;
++    codecCtx_->thread_type = FF_THREAD_SLICE;
+   }
+ 
+   int ret;

From 9a19bb3bb5f36a87d4d4c0752fed69d782acb45c Mon Sep 17 00:00:00 2001
From: jfgrimm <jasper.grimm@york.ac.uk>
Date: Fri, 2 Feb 2024 11:32:04 +0000
Subject: [PATCH 3/8] add 3dem patches for topaz

---
 ...z-0.2.5.20231120-foss-2023a-CUDA-12.1.1.eb |  11 +-
 ....5.20231120_helical-filament-picking.patch | 289 ++++++++++++++++++
 ...az-0.2.5.20231120_update-description.patch |  24 ++
 3 files changed, 322 insertions(+), 2 deletions(-)
 create mode 100644 easybuild/easyconfigs/t/topaz/topaz-0.2.5.20231120_helical-filament-picking.patch
 create mode 100644 easybuild/easyconfigs/t/topaz/topaz-0.2.5.20231120_update-description.patch

diff --git a/easybuild/easyconfigs/t/topaz/topaz-0.2.5.20231120-foss-2023a-CUDA-12.1.1.eb b/easybuild/easyconfigs/t/topaz/topaz-0.2.5.20231120-foss-2023a-CUDA-12.1.1.eb
index a99c772078df..877445f182e2 100644
--- a/easybuild/easyconfigs/t/topaz/topaz-0.2.5.20231120-foss-2023a-CUDA-12.1.1.eb
+++ b/easybuild/easyconfigs/t/topaz/topaz-0.2.5.20231120-foss-2023a-CUDA-12.1.1.eb
@@ -1,4 +1,4 @@
-# Thomas Hoffman, EMBL Heidelberg, structures-it@embl.de, 2023/11 
+# Thomas Hoffman, EMBL Heidelberg, structures-it@embl.de, 2023/11
 easyblock = 'PythonPackage'
 
 name = 'topaz'
@@ -10,7 +10,7 @@ versionsuffix = '-CUDA-%(cudaver)s'
 
 homepage = 'http://cb.csail.mit.edu/cb/topaz/'
 
-description = """Particle picking software for single particle cryo-electron microscopy using    
+description = """Particle picking software for single particle cryo-electron microscopy using
 convolutional neural networks and positive-unlabeled learning. Includes methods
 for micrograph denoising."""
 
@@ -23,6 +23,7 @@ dependencies = [
     ('PyTorch', '2.1.2', versionsuffix),
     ('scikit-learn', '1.3.1'),
     ('torchvision', '0.16.2', versionsuffix),
+    ('scikit-image', '0.22.0'),
 ]
 
 source_urls = ['https://github.com/tbepler/topaz/archive']
@@ -32,10 +33,16 @@ sources = [{
 }]
 patches = [
     'topaz-0.2.5_install_relion3_wrappers.patch',
+    'topaz-0.2.5.20231120_helical-filament-picking.patch',
+    'topaz-0.2.5.20231120_update-description.patch',
 ]
 checksums = [
     {'topaz-0.2.5.20231120.tar.gz': 'ca0630f9a69622eb3e10c9de310f58ac846e60a5504c4533398a9a75b3091df9'},
     {'topaz-0.2.5_install_relion3_wrappers.patch': '0fe23a0ecaf887aaa89641a7e7cf37fafd3134384b0a8f46acb4e17537d1a151'},
+    {'topaz-0.2.5.20231120_helical-filament-picking.patch':
+     '320466e4ac1d1f06ba392a419aefa369905baa6877717868cd8ea7135b6bc28f'},
+    {'topaz-0.2.5.20231120_update-description.patch':
+     '073241dba2de63e543136a387ff7ef698a5e0139ab3356de021e370338fa57c1'},
 ]
 
 download_dep_fail = True
diff --git a/easybuild/easyconfigs/t/topaz/topaz-0.2.5.20231120_helical-filament-picking.patch b/easybuild/easyconfigs/t/topaz/topaz-0.2.5.20231120_helical-filament-picking.patch
new file mode 100644
index 000000000000..2e8413fd5e34
--- /dev/null
+++ b/easybuild/easyconfigs/t/topaz/topaz-0.2.5.20231120_helical-filament-picking.patch
@@ -0,0 +1,289 @@
+From 4ea1710c88648ff4c5f7232e20ad5d9aa9535241 Mon Sep 17 00:00:00 2001
+From: scheres <scheres@mrc-lmb.cam.ac.uk>
+Date: Wed, 5 Jan 2022 12:13:10 +0000
+Subject: [PATCH] implemented helical filament picking in extract.py
+
+---
+ topaz/commands/extract.py | 225 ++++++++++++++++++++++++++++++++++++--
+ 1 file changed, 215 insertions(+), 10 deletions(-)
+
+diff --git a/topaz/commands/extract.py b/topaz/commands/extract.py
+index 3c3f032..6676618 100644
+--- a/topaz/commands/extract.py
++++ b/topaz/commands/extract.py
+@@ -52,6 +52,11 @@ def add_arguments(parser):
+     parser.add_argument('--targets', help='path to file specifying particle coordinates. used to find extraction radius that maximizes the AUPRC') 
+     parser.add_argument('--only-validate', action='store_true', help='flag indicating to only calculate validation metrics. does not report full prediction list')
+ 
++    # Filament picking SHWS 30032021
++    parser.add_argument('-f', '--filaments', action='store_true', help='flag for filament start-end picking.')
++    parser.add_argument('-fp', '--filaments_plot', action='store_true', help='flag for filament start-end picking plus plotting of its intermediate stages (useful for tuning parameters).')
++    parser.add_argument('-fl', '--filaments_length', default=-1, type=int, help='minimum length of straight filament segments to be picked (in Angstrom) (default: twice --radius)')
++
+     parser.add_argument('-d', '--device', default=0, type=int, help='which device to use, <0 corresponds to CPU')
+ 
+     parser.add_argument('-o', '--output', help='file path to write')
+@@ -63,24 +68,219 @@ def add_arguments(parser):
+ 
+     return parser
+ 
++
++def is_in_between(point, line):
++    dx = line[1][0] - line[0][0]
++    dy = line[1][1] - line[0][1]
++    dotp = (point[0] - line[0][0])*dx + (point[1] - line[0][1])*dy
++    return 0 <= dotp and dotp <= dx*dx + dy*dy
++
++def distance_point_line(point, line):
++    x1=line[0][0]
++    x2=line[1][0]
++    y1=line[0][1]
++    y2=line[1][1]
++    x0=point[0]
++    y0=point[1]
++    dd = abs( (x2-x1)*(y1-y0) - (x1-x0)*(y2-y1) ) / np.sqrt( (x2-x1)*(x2-x1) + (y2-y1)*(y2-y1) )
++    if not is_in_between(point,line):
++        closest = min(distance_point_point(point,line[0]), distance_point_point(point,line[1]))
++        return max(closest, dd)
++    else:
++        return dd
++
++def distance_point_point(point1, point2):
++    x1=point1[0]
++    y1=point1[1]
++    x2=point2[0]
++    y2=point2[1]
++    return np.sqrt((x1-x2)*(x1-x2) + (y1-y2)*(y1-y2))
++
++def angle_line_line(line1, line2):
++    a1 = np.arctan2(line1[1][1]-line1[0][1], line1[1][0]-line1[0][0])
++    a2 = np.arctan2(line2[1][1]-line2[0][1], line2[1][0]-line2[0][0])
++    return abs(a2-a1)
++
++def prune_lines(inlines, mind, min_ang, max_merge):
++    import math
++    lengths = []
++    merged = []
++    lines = np.asarray(inlines)
++    for line in lines:
++        lengths = np.append(lengths, np.linalg.norm(line[0]-line[1]))
++        merged = np.append(merged, 1)
++    sortidx = np.argsort(lengths);
++
++    min_ang_rad = math.radians(min_ang)
++    NN = len(sortidx)
++    idx = NN - 1
++    while idx >= 0:
++        i1 = sortidx[idx]
++
++        for i2 in range(NN):
++            if (i1 != i2 and lengths[i2] > 0. and lengths[i1] > 0.):
++                
++                d11 = distance_point_line(lines[i1][0],lines[i2])
++                d12 = distance_point_line(lines[i1][1],lines[i2])
++                d21 = distance_point_line(lines[i2][0],lines[i1])
++                d22 = distance_point_line(lines[i2][1],lines[i1])
++                ang = angle_line_line(lines[i1], lines[i2])
++                sum = 0
++                if (d11 < mind):
++                    sum = sum + 1
++                if (d12 < mind):
++                    sum = sum + 1
++                if (d21 < mind):
++                    sum = sum + 1
++                if (d22 < mind):
++                    sum = sum + 1
++
++                # merge lines if they haven't been merged too often already, they overlap two or more points and are parallel
++                if ( (merged[i1] + merged[i2] < max_merge) and (sum >= 2) and (ang < min_ang_rad or abs(ang-math.pi) < min_ang_rad) ):
++
++                    # select the two points with the furthest distance
++                    maxd=0
++                    for i in range(2):
++                        for j in range(2):
++                            d = distance_point_point(lines[i1][i], lines[i2][j])
++                            if (d > maxd):
++                                maxd = d
++                                mymax0 = lines[i1][i]
++                                mymax1 = lines[i2][j]
++                    # perhaps original one was longer?
++                    if maxd > lengths[i1]:
++                        lines[i1][0] = mymax0
++                        lines[i1][1] = mymax1
++                        lengths[i1] = np.linalg.norm(lines[i1][0]-lines[i1][1])
++                        merged[i1] = merged[i1] + merged[i2]
++                    
++                    lines[i2][0][0] = -9999
++                    lines[i2][0][1] = -9999
++                    lines[i2][1][0] = -9999
++                    lines[i2][1][1] = -9999
++                    lengths[i2] = 0
++                    merged[i2] = 0
++                    idx = idx + 1
++                    break
++
++                # remove smaller lines with both points close to longer one
++                elif (d21 < mind and d22 < mind):
++                    lines[i2][0][0] = -9999
++                    lines[i2][0][1] = -9999
++                    lines[i2][1][0] = -9999
++                    lines[i2][1][1] = -9999
++                    lengths[i2] = 0
++
++        idx = idx - 1
++
++    return lines
++
++
++def pick_filaments(score, radius, threshold, filaments_length, filaments_plot):
++    from topaz import mrc
++    from skimage.filters import gaussian
++    from skimage.transform import probabilistic_hough_line
++    from skimage.morphology import skeletonize
++    import math
++
++    #Parameters
++    thr = round(0.1*filaments_length)
++    line_length = filaments_length
++    gap = radius
++    mind= radius
++    min_angle = 10
++    max_merge = 5
++
++    bin_score = (gaussian(score, 3) > threshold)        
++    edges = skeletonize(bin_score) 
++    houghs = probabilistic_hough_line(edges, threshold=thr, line_length=line_length, line_gap=gap)
++    lines = prune_lines(houghs, mind=mind, min_ang=min_angle, max_merge=max_merge)
++
++    if filaments_plot:
++        import matplotlib.pyplot as plt
++        from matplotlib import cm
++        fig, axes = plt.subplots(1, 4, figsize=(15, 5), sharex=True, sharey=True)
++        ax = axes.ravel()
++
++        ax[0].imshow(score, cmap=cm.binary, vmin=-20, vmax=5)
++        ax[0].imshow(bin_score, alpha=0.5, cmap=cm.Reds)
++        ax[0].set_title('FOM [-20,5] thr= ' + str(threshold))
++
++        ax[1].imshow(edges, cmap=cm.gray)
++        ax[1].set_title('Skeletonize')
++
++        ax[2].imshow(edges * 0)
++        for hough in houghs:
++            p0, p1 = hough
++            ax[2].plot((p0[0], p1[0]), (p0[1], p1[1]))
++        ax[2].set_xlim((0, score.shape[1]))
++        ax[2].set_ylim((score.shape[0], 0))
++        ax[2].set_title('Hough transform; len= ' + str(line_length) + ' gap= ' + str(gap))
++
++        ax[3].imshow(edges * 0)
++        for line in lines:
++            p0, p1 = line
++            ax[3].plot((p0[0], p1[0]), (p0[1], p1[1]))
++        ax[3].set_xlim((0, score.shape[1]))
++        ax[3].set_ylim((score.shape[0], 0))
++        ax[3].set_title('Prune: mind= ' + str(mind))
++
++        for a in ax:
++            a.set_axis_off()
++
++        plt.tight_layout()
++        plt.show()
++
++    oldlines=lines
++    # Flatten lines into 2D array, as rest of topaz
++    NN=len(lines)
++    if NN>0:
++        lines = lines.reshape(2*NN, 2)
++        # Remove -9999 coordinates
++        newlines = []
++        for i in range(2*NN):
++            if (lines[i,0] != -9999 and lines[i,1] != -9999):
++                newlines = np.append(newlines, lines[i])
++
++        NN=round(len(newlines)/2)
++        if (NN>0):
++            lines = newlines.reshape(NN, 2)
++        else:
++            lines = []
++
++    # Just set scores to zero, a they are meaningless now
++    scores = np.zeros(NN, dtype=np.float32)
++
++    return scores, lines
++
++
+ class NonMaximumSuppression:
+-    def __init__(self, radius, threshold):
++    def __init__(self, radius, threshold, do_filaments=False, filaments_length=150, filaments_plot=False):
+         self.radius = radius
+         self.threshold = threshold
++        self.do_filaments = do_filaments
++        self.filaments_length = filaments_length
++        self.filaments_plot = filaments_plot
+ 
+     def __call__(self, args):
+         name,score = args
+-        score,coords = non_maximum_suppression(score, self.radius, threshold=self.threshold)
+-        return name, score, coords
++        if self.do_filaments:
++            score,coords = pick_filaments(score, self.radius, threshold=self.threshold, filaments_length=self.filaments_length, filaments_plot = self.filaments_plot )
++        else:
++            score,coords = non_maximum_suppression(score, self.radius, threshold=self.threshold)
++        return name, score, coords
+ 
+-def nms_iterator(scores, radius, threshold, pool=None):
+-    process = NonMaximumSuppression(radius, threshold)
++def nms_iterator(scores, radius, threshold, pool=None, do_filaments=False, filaments_length=150, filaments_plot=False):
++    process = NonMaximumSuppression(radius, threshold, do_filaments, filaments_length, filaments_plot)
+     if pool is not None:
+         for name,score,coords in pool.imap_unordered(process, scores):
+             yield name,score,coords
+     else:
+         for name,score in scores:
+-            score,coords = non_maximum_suppression(score, radius, threshold=threshold)
++            if do_filaments:
++                score,coords = pick_filaments(score, radius, threshold=threshold, filaments_length=filaments_length, filaments_plot=filaments_plot)
++            else:
++                score,coords = non_maximum_suppression(score, radius, threshold=threshold)
+             yield name,score,coords
+ 
+ def iterate_score_target_pairs(scores, targets):
+@@ -231,6 +431,12 @@ def main(args):
+     if radius is None:
+         radius = -1
+ 
++    do_filaments = args.filaments or args.filaments_plot
++    filaments_length = args.filaments_length
++    if (filaments_length < 0):
++        filaments_length = 2 * radius
++    filaments_plot = args.filaments_plot
++
+     num_workers = args.num_workers
+     pool = None
+     if num_workers < 0:
+@@ -284,12 +490,13 @@ def main(args):
+ 
+         if not per_micrograph:
+             print('image_name\tx_coord\ty_coord\tscore', file=f)
++
+         ## extract coordinates using radius 
+-        for path,score,coords in nms_iterator(stream, radius, threshold, pool=pool):
++        for path,score,coords in nms_iterator(stream, radius, threshold, pool=pool, do_filaments=do_filaments, filaments_length=filaments_length, filaments_plot=filaments_plot):
+             basename = os.path.basename(path)
+             name = os.path.splitext(basename)[0]
+             ## scale the coordinates
+-            if scale != 1:
++            if scale != 1 and len(coords)>0:
+                 coords = np.round(coords*scale).astype(int)
+ 
+             if per_micrograph:
+@@ -303,8 +510,6 @@ def main(args):
+                     print(name + '\t' + str(coords[i,0]) + '\t' + str(coords[i,1]) + '\t' + str(score[i]), file=f)
+ 
+ 
+-
+-
+ if __name__ == '__main__':
+     import argparse
+     parser = argparse.ArgumentParser('Script for extracting particles from segmented images or images processed with a trained model. Uses a non maximum suppression algorithm.')
diff --git a/easybuild/easyconfigs/t/topaz/topaz-0.2.5.20231120_update-description.patch b/easybuild/easyconfigs/t/topaz/topaz-0.2.5.20231120_update-description.patch
new file mode 100644
index 000000000000..f52fac9497d8
--- /dev/null
+++ b/easybuild/easyconfigs/t/topaz/topaz-0.2.5.20231120_update-description.patch
@@ -0,0 +1,24 @@
+From 14b2bc331768b67b3267397523de57c707fa1253 Mon Sep 17 00:00:00 2001
+From: scheres <scheres@mrc-lmb.cam.ac.uk>
+Date: Fri, 25 Mar 2022 09:27:07 +0000
+Subject: [PATCH] added description of new options and dependency on skimage
+
+---
+ README.md | 4 ++++
+ 1 file changed, 4 insertions(+)
+
+diff --git a/README.md b/README.md
+index bed6f4f..a98993c 100644
+--- a/README.md
++++ b/README.md
+@@ -3,6 +3,10 @@ A pipeline for particle detection in cryo-electron microscopy images using convo
+ 
+ **Check out our [Discussion](https://github.com/tbepler/topaz/discussions) section for general help, suggestions, and tips on using Topaz.**
+ 
++## New in modification for filament picking:
++- Added support for filament start-end coordinate picking (new options -f, -fp and -fl in the extract command), for subsequent helical reconstruction in RELION
++- This adds a new dependency to skimage (make sure you install this in your conda environment)
++
+ ## New in v0.2.5
+ - Added Relion integration scripts
+ - Topaz extract can now write particle coordinates to one file per input micrograph

From 8d01616883c03835b17f6c8725e3a197f2ebb5e4 Mon Sep 17 00:00:00 2001
From: jfgrimm <jasper.grimm@york.ac.uk>
Date: Tue, 27 Feb 2024 11:34:26 +0000
Subject: [PATCH 4/8] use PyTorch-bundle instead of separate torchvision
 easyconfig

---
 ...rch-bundle-2.1.2-foss-2023a-CUDA-12.1.1.eb | 79 +++++++++++++++++++
 .../SentencePiece-0.2.0-GCC-12.3.0.eb         | 65 +++++++++++++++
 ...rchvision-0.16.2-foss-2023a-CUDA-12.1.1.eb | 27 -------
 3 files changed, 144 insertions(+), 27 deletions(-)
 create mode 100644 easybuild/easyconfigs/p/PyTorch-bundle/PyTorch-bundle-2.1.2-foss-2023a-CUDA-12.1.1.eb
 create mode 100644 easybuild/easyconfigs/s/SentencePiece/SentencePiece-0.2.0-GCC-12.3.0.eb
 delete mode 100644 easybuild/easyconfigs/t/torchvision/torchvision-0.16.2-foss-2023a-CUDA-12.1.1.eb

diff --git a/easybuild/easyconfigs/p/PyTorch-bundle/PyTorch-bundle-2.1.2-foss-2023a-CUDA-12.1.1.eb b/easybuild/easyconfigs/p/PyTorch-bundle/PyTorch-bundle-2.1.2-foss-2023a-CUDA-12.1.1.eb
new file mode 100644
index 000000000000..344d73613b22
--- /dev/null
+++ b/easybuild/easyconfigs/p/PyTorch-bundle/PyTorch-bundle-2.1.2-foss-2023a-CUDA-12.1.1.eb
@@ -0,0 +1,79 @@
+easyblock = 'PythonBundle'
+
+name = 'PyTorch-bundle'
+version = '2.1.2'
+versionsuffix = '-CUDA-%(cudaver)s'
+
+homepage = 'https://pytorch.org/'
+description = """PyTorch with compatible versions of official Torch extensions."""
+
+toolchain = {'name': 'foss', 'version': '2023a'}
+
+builddependencies = [
+    ('CMake', '3.26.3'),
+    ('RE2', '2023-08-01'),  # for torchtext
+]
+
+dependencies = [
+    ('CUDA', '12.1.1', '', SYSTEM),
+    ('Python', '3.11.3'),
+    ('PyTorch', version, versionsuffix),
+    ('Pillow-SIMD', '9.5.0'),  # for torchvision
+    ('SentencePiece', '0.2.0'),  # for torchtext
+    ('tqdm', '4.66.1'),  # for torchtext
+    ('double-conversion', '3.3.0'),  # for torchtext
+    ('utf8proc', '2.8.0'),  # for torchtext
+    ('tensorboard', '2.15.1'),  # for torch-tb-profiler
+]
+
+use_pip = True
+
+exts_list = [
+    ('portalocker', '2.8.2', {
+        'checksums': ['2b035aa7828e46c58e9b31390ee1f169b98e1066ab10b9a6a861fe7e25ee4f33'],
+    }),
+    ('torchdata', '0.7.1', {
+        'preinstallopts': "USE_SYSTEM_LIBS=1 ",
+        'source_urls': ['https://github.com/pytorch/data/archive'],
+        'sources': [{'download_filename': 'v%(version)s.tar.gz', 'filename': '%(name)s-%(version)s.tar.gz'}],
+        'checksums': ['ef9bbdcee759b53c3c9d99e76eb0a66da33d36bfb7f859a25a9b5e737a51fa23'],
+    }),
+    ('torchtext', '0.17.1', {
+        'patches': [
+            'torchtext-0.14.1_use-system-libs.patch',
+        ],
+        'source_urls': ['https://github.com/pytorch/text/archive'],
+        'sources': [{'download_filename': 'v%(version)s.tar.gz', 'filename': '%(name)s-%(version)s.tar.gz'}],
+        'checksums': [
+            {'torchtext-0.17.1.tar.gz': '1b21c1efb13072465bc11dbb7b80e8bdc3aca3cee9234242f57f0503f3db47f5'},
+            {'torchtext-0.14.1_use-system-libs.patch':
+             '1366d10c4755b6003194f7313ca11d165a80a13d325bee9d669ea2b333d82536'},
+            {'torchtext-0.13.1_cxx_17.patch': 'fd242c139baa27352d1065cece4658a3ede76f46ffec08ac04a554301e547f22'},
+        ],
+    }),
+    ('torchvision', '0.16.2', {
+        'patches': ['torchvision-0.16.2_ffmpeg-6.0-fix.patch'],
+        'source_urls': ['https://github.com/pytorch/vision/archive'],
+        'sources': [{'download_filename': 'v%(version)s.tar.gz', 'filename': '%(name)s-%(version)s.tar.gz'}],
+        'checksums': [
+            {'torchvision-0.16.2.tar.gz': '8c1f2951e98d8ada6e5a468f179af4be9f56d2ebc3ab057af873da61669806d7'},
+            {'torchvision-0.16.2_ffmpeg-6.0-fix.patch':
+             'a49336e7bfa1c950e886852bff37a3ea2146ac7bda87241e3ffb31c5cb869cce'},
+        ],
+    }),
+    ('pytorch-ignite', '0.4.13', {
+        'modulename': 'ignite',
+        'source_urls': ['https://github.com/pytorch/ignite/archive'],
+        'sources': [{'download_filename': 'v%(version)s.tar.gz', 'filename': '%(name)s-%(version)s.tar.gz'}],
+        'checksums': ['bfe4b6f1cd96e78c021a65a0c51350cdb89d6ef5a8b9609638666ca95bae51d7'],
+    }),
+    ('torch-tb-profiler', '0.4.3', {
+        'modulename': 'torch.profiler',
+        'sources': ['torch_tb_profiler-%(version)s.tar.gz'],
+        'checksums': ['8b8d29b2de960b3c4423087b23cec29beaf9ac3a8c7b046c18fd25b218f726b1'],
+    }),
+]
+
+sanity_pip_check = True
+
+moduleclass = 'ai'
diff --git a/easybuild/easyconfigs/s/SentencePiece/SentencePiece-0.2.0-GCC-12.3.0.eb b/easybuild/easyconfigs/s/SentencePiece/SentencePiece-0.2.0-GCC-12.3.0.eb
new file mode 100644
index 000000000000..42c6e7f5281d
--- /dev/null
+++ b/easybuild/easyconfigs/s/SentencePiece/SentencePiece-0.2.0-GCC-12.3.0.eb
@@ -0,0 +1,65 @@
+##
+# Author:    Robert Mijakovic <robert.mijakovic@lxp.lu>
+##
+easyblock = 'Bundle'
+
+name = 'SentencePiece'
+version = '0.2.0'
+
+homepage = 'https://github.com/google/sentencepiece'
+description = "Unsupervised text tokenizer for Neural Network-based text generation."
+github_account = 'google'
+
+toolchain = {'name': 'GCC', 'version': '12.3.0'}
+
+builddependencies = [
+    ('CMake', '3.26.3'),
+]
+
+dependencies = [
+    ('Python', '3.11.3'),
+    ('gperftools', '2.12'),
+]
+
+default_component_specs = {
+    'source_urls': [GITHUB_LOWER_SOURCE],
+    'sources': ['v%(version)s.tar.gz'],
+    'checksums': ['9970f0a0afee1648890293321665e5b2efa04eaec9f1671fcf8048f456f5bb86'],
+}
+
+components = [
+    (name, version, {
+        'easyblock': 'CMakeMake',
+        'separate_build_dir': True,
+        'start_dir': '%(namelower)s-%(version)s',
+    }),
+    ('sentencepiece', version, {
+        'easyblock': 'PythonPackage',
+        'start_dir': '%(namelower)s-%(version)s/python',
+        'prebuildopts': 'export PKG_CONFIG_PATH=%(installdir)s/lib/pkgconfig:$PKG_CONFIG_PATH && ',
+        'preinstallopts': 'export PKG_CONFIG_PATH=%(installdir)s/lib/pkgconfig:$PKG_CONFIG_PATH && ',
+        'use_pip': True,
+        'download_dep_fail': True,
+        'sanity_pip_check': True,
+    }),
+]
+
+postinstallcmds = ['cp -a %(builddir)s/%(namelower)s-%(version)s/{data,doc} %(installdir)s/']
+
+sanity_check_paths = {
+    'files': ['bin/spm_%s' % x for x in ['decode', 'encode', 'export_vocab', 'normalize', 'train']] +
+             ['lib/libsentencepiece.%s' % SHLIB_EXT, 'lib/libsentencepiece_train.%s' % SHLIB_EXT] +
+             ['include/sentencepiece_processor.h', 'include/sentencepiece_trainer.h'],
+    'dirs': ['lib/python%(pyshortver)s/site-packages', 'data', 'doc'],
+}
+
+sanity_check_commands = [
+    'spm_train --help',
+    "python -c 'import sentencepiece'",
+]
+
+modextrapaths = {
+    'PYTHONPATH': ['lib/python%(pyshortver)s/site-packages']
+}
+
+moduleclass = 'lib'
diff --git a/easybuild/easyconfigs/t/torchvision/torchvision-0.16.2-foss-2023a-CUDA-12.1.1.eb b/easybuild/easyconfigs/t/torchvision/torchvision-0.16.2-foss-2023a-CUDA-12.1.1.eb
deleted file mode 100644
index a72f7b8760aa..000000000000
--- a/easybuild/easyconfigs/t/torchvision/torchvision-0.16.2-foss-2023a-CUDA-12.1.1.eb
+++ /dev/null
@@ -1,27 +0,0 @@
-name = 'torchvision'
-version = '0.16.2'
-versionsuffix = '-CUDA-%(cudaver)s'
-
-homepage = 'https://github.com/pytorch/vision'
-description = " Datasets, Transforms and Models specific to Computer Vision"
-
-toolchain = {'name': 'foss', 'version': '2023a'}
-
-source_urls = ['https://github.com/pytorch/vision/archive']
-sources = ['v%(version)s.tar.gz']
-patches = ['%(name)s-0.16.2_ffmpeg-6.0-fix.patch']
-checksums = [
-    {'v0.16.2.tar.gz': '8c1f2951e98d8ada6e5a468f179af4be9f56d2ebc3ab057af873da61669806d7'},
-    {'torchvision-0.16.2_ffmpeg-6.0-fix.patch': 'a49336e7bfa1c950e886852bff37a3ea2146ac7bda87241e3ffb31c5cb869cce'},
-]
-
-builddependencies = [('CMake', '3.26.3')]
-
-dependencies = [
-    ('CUDA', '12.1.1', '', SYSTEM),
-    ('Python', '3.11.3'),
-    ('Pillow-SIMD', '9.5.0'),
-    ('PyTorch', '2.1.2', '-CUDA-%(cudaver)s'),
-]
-
-moduleclass = 'vis'

From 47793b27245967dff14ecf186de21be06e13e0a2 Mon Sep 17 00:00:00 2001
From: jfgrimm <jasper.grimm@york.ac.uk>
Date: Tue, 27 Feb 2024 11:39:01 +0000
Subject: [PATCH 5/8] move patch

---
 .../PyTorch-bundle}/torchvision-0.16.2_ffmpeg-6.0-fix.patch       | 0
 1 file changed, 0 insertions(+), 0 deletions(-)
 rename easybuild/easyconfigs/{t/torchvision => p/PyTorch-bundle}/torchvision-0.16.2_ffmpeg-6.0-fix.patch (100%)

diff --git a/easybuild/easyconfigs/t/torchvision/torchvision-0.16.2_ffmpeg-6.0-fix.patch b/easybuild/easyconfigs/p/PyTorch-bundle/torchvision-0.16.2_ffmpeg-6.0-fix.patch
similarity index 100%
rename from easybuild/easyconfigs/t/torchvision/torchvision-0.16.2_ffmpeg-6.0-fix.patch
rename to easybuild/easyconfigs/p/PyTorch-bundle/torchvision-0.16.2_ffmpeg-6.0-fix.patch

From 6bb22cff3946a48c69000803b885806fbcccfc83 Mon Sep 17 00:00:00 2001
From: Jasper Grimm <65227842+jfgrimm@users.noreply.github.com>
Date: Tue, 27 Feb 2024 11:59:21 +0000
Subject: [PATCH 6/8] delete unused checksum

---
 .../PyTorch-bundle-2.1.2-foss-2023a-CUDA-12.1.1.eb               | 1 -
 1 file changed, 1 deletion(-)

diff --git a/easybuild/easyconfigs/p/PyTorch-bundle/PyTorch-bundle-2.1.2-foss-2023a-CUDA-12.1.1.eb b/easybuild/easyconfigs/p/PyTorch-bundle/PyTorch-bundle-2.1.2-foss-2023a-CUDA-12.1.1.eb
index 344d73613b22..e6eb6a4aef4c 100644
--- a/easybuild/easyconfigs/p/PyTorch-bundle/PyTorch-bundle-2.1.2-foss-2023a-CUDA-12.1.1.eb
+++ b/easybuild/easyconfigs/p/PyTorch-bundle/PyTorch-bundle-2.1.2-foss-2023a-CUDA-12.1.1.eb
@@ -48,7 +48,6 @@ exts_list = [
             {'torchtext-0.17.1.tar.gz': '1b21c1efb13072465bc11dbb7b80e8bdc3aca3cee9234242f57f0503f3db47f5'},
             {'torchtext-0.14.1_use-system-libs.patch':
              '1366d10c4755b6003194f7313ca11d165a80a13d325bee9d669ea2b333d82536'},
-            {'torchtext-0.13.1_cxx_17.patch': 'fd242c139baa27352d1065cece4658a3ede76f46ffec08ac04a554301e547f22'},
         ],
     }),
     ('torchvision', '0.16.2', {

From d8bb18c88b8e7e7f2ae07ea013651717071eaace Mon Sep 17 00:00:00 2001
From: Jasper Grimm <65227842+jfgrimm@users.noreply.github.com>
Date: Tue, 27 Feb 2024 12:40:22 +0000
Subject: [PATCH 7/8] switch topaz to pytorch bundle

---
 .../t/topaz/topaz-0.2.5.20231120-foss-2023a-CUDA-12.1.1.eb     | 3 +--
 1 file changed, 1 insertion(+), 2 deletions(-)

diff --git a/easybuild/easyconfigs/t/topaz/topaz-0.2.5.20231120-foss-2023a-CUDA-12.1.1.eb b/easybuild/easyconfigs/t/topaz/topaz-0.2.5.20231120-foss-2023a-CUDA-12.1.1.eb
index 877445f182e2..8156c8d8dbc0 100644
--- a/easybuild/easyconfigs/t/topaz/topaz-0.2.5.20231120-foss-2023a-CUDA-12.1.1.eb
+++ b/easybuild/easyconfigs/t/topaz/topaz-0.2.5.20231120-foss-2023a-CUDA-12.1.1.eb
@@ -20,9 +20,8 @@ dependencies = [
     ('CUDA', '12.1.1', '', SYSTEM),
     ('Python', '3.11.3'),
     ('SciPy-bundle', '2023.07'),
-    ('PyTorch', '2.1.2', versionsuffix),
+    ('PyTorch-bundle', '2.1.2', versionsuffix),
     ('scikit-learn', '1.3.1'),
-    ('torchvision', '0.16.2', versionsuffix),
     ('scikit-image', '0.22.0'),
 ]
 

From 7cc4df1c222092b79d687b876574207c88384f9c Mon Sep 17 00:00:00 2001
From: Jasper Grimm <65227842+jfgrimm@users.noreply.github.com>
Date: Fri, 12 Apr 2024 15:19:14 +0100
Subject: [PATCH 8/8] Update
 easybuild/easyconfigs/s/SentencePiece/SentencePiece-0.2.0-GCC-12.3.0.eb

---
 .../s/SentencePiece/SentencePiece-0.2.0-GCC-12.3.0.eb            | 1 -
 1 file changed, 1 deletion(-)

diff --git a/easybuild/easyconfigs/s/SentencePiece/SentencePiece-0.2.0-GCC-12.3.0.eb b/easybuild/easyconfigs/s/SentencePiece/SentencePiece-0.2.0-GCC-12.3.0.eb
index e620faf028f2..1ff1c337cf7b 100644
--- a/easybuild/easyconfigs/s/SentencePiece/SentencePiece-0.2.0-GCC-12.3.0.eb
+++ b/easybuild/easyconfigs/s/SentencePiece/SentencePiece-0.2.0-GCC-12.3.0.eb
@@ -43,7 +43,6 @@ components = [
                         '$PKG_CONFIG_PATH && ',
         'preinstallopts': 'export PKG_CONFIG_PATH=%(installdir)s/lib64/pkgconfig:%(installdir)s/lib/pkgconfig/:'
                           '$PKG_CONFIG_PATH && ',
-
         'use_pip': True,
         'download_dep_fail': True,
         'sanity_pip_check': True,