-
Notifications
You must be signed in to change notification settings - Fork 1k
New modules: llamacpp-python/run and huggingface/download to allow running simple text workloads with local LLMs #11053
New issue
Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.
By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.
Already on GitHub? Sign in to your account
base: master
Are you sure you want to change the base?
Changes from 29 commits
7f1b7d7
9031f48
04cd556
537a891
20b5d26
c9997f5
5035e82
2c796de
4f64bac
ff7039c
7a3f8fc
fb1768c
ac7f44c
26168b7
6dfff97
2d171ca
ee04a27
3021074
4630e5a
53c7826
4156db0
421603e
af5eadd
02d3f6d
297f503
ac61a56
ca4721b
8fdffea
9a0d9f3
d65181d
cd3d1b9
fb81365
6f2affa
dfadccb
1dbb3e9
File filter
Filter by extension
Conversations
Jump to
Diff view
Diff view
There are no files selected for viewing
| Original file line number | Diff line number | Diff line change |
|---|---|---|
| @@ -0,0 +1,6 @@ | ||
| --- | ||
| # yaml-language-server: $schema=https://raw.githubusercontent.com/nf-core/modules/master/modules/environment-schema.json | ||
| channels: | ||
| - conda-forge | ||
| dependencies: | ||
| - conda-forge::huggingface_hub=1.6.0 |
| Original file line number | Diff line number | Diff line change |
|---|---|---|
| @@ -0,0 +1,30 @@ | ||
| process HUGGINGFACE_DOWNLOAD { | ||
| tag "${meta.id}" | ||
| label 'process_medium' | ||
|
|
||
| conda "${moduleDir}/environment.yml" | ||
| container "community.wave.seqera.io/library/huggingface_hub:1.6.0--c106a7f9664ca39b" | ||
|
|
||
| input: | ||
| tuple val(meta), val(hf_repo), val(hf_file), val(hf_home) | ||
|
|
||
| output: | ||
| tuple val(meta), path(hf_file), emit: output | ||
| tuple val("${task.process}"), val("huggingface_hub"), eval("hf --version 2>&1 | tail -n1 | awk '{print \$NF}'"), topic: versions, emit: versions_huggingface_hub | ||
|
|
||
| when: | ||
| task.ext.when == null || task.ext.when | ||
|
|
||
| script: | ||
| def hf_home_resolved = hf_home ?: "${workflow.workDir}/hf_cache" | ||
toniher marked this conversation as resolved.
Outdated
Show resolved
Hide resolved
|
||
| """ | ||
| export HF_HOME="${hf_home_resolved}" | ||
| export HF_HUB_CACHE=\$HF_HOME | ||
| hf download ${hf_repo} ${hf_file} --local-dir \$PWD | ||
| """ | ||
|
|
||
| stub: | ||
| """ | ||
| touch ${hf_file} | ||
toniher marked this conversation as resolved.
Show resolved
Hide resolved
|
||
| """ | ||
| } | ||
| Original file line number | Diff line number | Diff line change |
|---|---|---|
| @@ -0,0 +1,67 @@ | ||
| name: huggingface_download | ||
| description: Command-line interface for downloading models in GGUF format from Hugging Face Hub | ||
| keywords: | ||
| - ai | ||
| - gguf | ||
| - llama | ||
| - llm | ||
| tools: | ||
| - huggingface_hub: | ||
| description: "Command-line interface for interacting with Hugging Face Hub, allowing users to download, upload and interact with models and datasets" | ||
| homepage: "https://huggingface.co/docs/huggingface_hub/guides/cli" | ||
| licence: | ||
| - "MIT" | ||
| identifier: "" | ||
| input: | ||
| - - meta: | ||
| type: map | ||
| description: | | ||
| Groovy Map containing sample information | ||
| e.g. `[ id:'sample1' ]` | ||
| - hf_repo: | ||
| type: string | ||
| description: Hugging Face repository | ||
| - hf_file: | ||
| type: string | ||
| description: Hugging Face GGUF file | ||
| - hf_home: | ||
| type: string | ||
| description: Hugging Face default cache directory | ||
| output: | ||
| output: | ||
| - - meta: | ||
| type: map | ||
| description: | | ||
| Groovy Map containing sample information | ||
| e.g. `[ id:'sample1' ]` | ||
| - hf_file: | ||
| type: file | ||
| description: Downloaded Hugging Face GGUF file | ||
| ontologies: [] | ||
| versions_huggingface_hub: | ||
| - - ${task.process}: | ||
| type: string | ||
| description: The name of the process | ||
| - huggingface_hub: | ||
| type: string | ||
| description: The name of the tool | ||
| - hf --version 2>&1 | tail -n1 | awk '{print \$NF}': | ||
| type: eval | ||
| description: The expression to obtain the version of the tool | ||
| topics: | ||
| versions: | ||
| - - ${task.process}: | ||
| type: string | ||
| description: The name of the process | ||
| - huggingface_hub: | ||
| type: string | ||
| description: The name of the tool | ||
| - hf --version 2>&1 | tail -n1 | awk '{print \$NF}': | ||
| type: eval | ||
| description: The expression to obtain the version of the tool | ||
| authors: | ||
| - "@toniher" | ||
| - "@lucacozzuto" | ||
| maintainers: | ||
| - "@toniher" | ||
| - "@lucacozzuto" |
| Original file line number | Diff line number | Diff line change |
|---|---|---|
| @@ -0,0 +1,90 @@ | ||
| nextflow_process { | ||
|
|
||
| name "Test Process HUGGINGFACE_DOWNLOAD" | ||
| script "../main.nf" | ||
| process "HUGGINGFACE_DOWNLOAD" | ||
|
|
||
| tag "modules" | ||
| tag "modules_nfcore" | ||
| tag "huggingface" | ||
| tag "huggingface/download" | ||
|
|
||
| test("download gguf file - gemma3") { | ||
|
|
||
| when { | ||
| process { | ||
| """ | ||
| input[0] = [ | ||
| [ id:'test_model_gemma3' ], | ||
| "ggml-org/gemma-3-1b-it-GGUF", | ||
| "gemma-3-1b-it-Q4_K_M.gguf", | ||
| "./hf_cache" | ||
| ] | ||
| """ | ||
| } | ||
| } | ||
|
|
||
| then { | ||
| assertAll( | ||
| { assert process.success }, | ||
| { assert process.out.output.size() == 1 }, | ||
| { assert process.out.output[0][0] == [ id:'test_model_gemma3' ] }, | ||
| { assert file(process.out.output[0][1]).name == "gemma-3-1b-it-Q4_K_M.gguf" }, | ||
| { assert file(process.out.output[0][1]).size() > 0 }, | ||
| { assert snapshot(process.out.findAll { key, val -> key.startsWith('versions') }).match() } | ||
| ) | ||
| } | ||
| } | ||
|
|
||
| test("download gguf file - smollm3") { | ||
|
|
||
| when { | ||
| process { | ||
| """ | ||
| input[0] = [ | ||
| [ id:'test_model_smollm3' ], | ||
| "unsloth/SmolLM3-3B-GGUF", | ||
| "SmolLM3-3B-UD-IQ2_XXS.gguf", | ||
| "./hf_cache" | ||
| ] | ||
| """ | ||
| } | ||
| } | ||
|
|
||
| then { | ||
| assertAll( | ||
| { assert process.success }, | ||
| { assert process.out.output.size() == 1 }, | ||
| { assert process.out.output[0][0] == [ id:'test_model_smollm3' ] }, | ||
| { assert file(process.out.output[0][1]).name == "SmolLM3-3B-UD-IQ2_XXS.gguf" }, | ||
| { assert file(process.out.output[0][1]).size() > 0 }, | ||
| { assert snapshot(process.out.findAll { key, val -> key.startsWith('versions') }).match() } | ||
toniher marked this conversation as resolved.
Outdated
Show resolved
Hide resolved
|
||
| ) | ||
| } | ||
| } | ||
|
|
||
| test("stub - download gguf file - gemma3") { | ||
|
|
||
| options "-stub" | ||
|
|
||
| when { | ||
| process { | ||
| """ | ||
| input[0] = [ | ||
| [ id:'test_model_gemma3' ], | ||
| "ggml-org/gemma-3-1b-it-GGUF", | ||
| "gemma-3-1b-it-Q4_K_M.gguf", | ||
| "./hf_cache" | ||
| ] | ||
| """ | ||
| } | ||
| } | ||
|
|
||
| then { | ||
| assertAll( | ||
| { assert process.success }, | ||
| { assert snapshot(sanitizeOutput(process.out)).match() } | ||
| ) | ||
| } | ||
| } | ||
| } | ||
| Original file line number | Diff line number | Diff line change |
|---|---|---|
| @@ -0,0 +1,64 @@ | ||
| { | ||
| "stub - download gguf file - gemma3": { | ||
| "content": [ | ||
| { | ||
| "output": [ | ||
| [ | ||
| { | ||
| "id": "test_model_gemma3" | ||
| }, | ||
| "gemma-3-1b-it-Q4_K_M.gguf:md5,d41d8cd98f00b204e9800998ecf8427e" | ||
| ] | ||
| ], | ||
| "versions_huggingface_hub": [ | ||
| [ | ||
| "HUGGINGFACE_DOWNLOAD", | ||
| "huggingface_hub", | ||
| "1.6.0" | ||
| ] | ||
| ] | ||
| } | ||
| ], | ||
| "timestamp": "2026-04-04T22:00:17.896195894", | ||
| "meta": { | ||
| "nf-test": "0.9.5", | ||
| "nextflow": "25.10.4" | ||
| } | ||
| }, | ||
| "download gguf file - gemma3": { | ||
| "content": [ | ||
| { | ||
| "versions_huggingface_hub": [ | ||
| [ | ||
| "HUGGINGFACE_DOWNLOAD", | ||
| "huggingface_hub", | ||
| "1.6.0" | ||
| ] | ||
| ] | ||
| } | ||
| ], | ||
| "timestamp": "2026-04-04T21:36:18.125789808", | ||
| "meta": { | ||
| "nf-test": "0.9.5", | ||
| "nextflow": "25.10.4" | ||
| } | ||
| }, | ||
| "download gguf file - smollm3": { | ||
| "content": [ | ||
| { | ||
| "versions_huggingface_hub": [ | ||
| [ | ||
| "HUGGINGFACE_DOWNLOAD", | ||
| "huggingface_hub", | ||
| "1.6.0" | ||
| ] | ||
| ] | ||
| } | ||
| ], | ||
| "timestamp": "2026-04-04T21:55:38.228583826", | ||
| "meta": { | ||
| "nf-test": "0.9.5", | ||
| "nextflow": "25.10.4" | ||
| } | ||
| } | ||
| } |
| Original file line number | Diff line number | Diff line change |
|---|---|---|
| @@ -0,0 +1,5 @@ | ||
| process { | ||
famosab marked this conversation as resolved.
Outdated
Show resolved
Hide resolved
|
||
| withName: 'HUGGINGFACE_DOWNLOAD' { | ||
| containerOptions = { workflow.profile.contains('docker') ? "--volume ${workDir}/hf_cache:${workDir}/hf_cache" : '' } | ||
| } | ||
| } | ||
|
Contributor
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. since this tool is on conda-forge, you don't need to add a dockerfile, just use seqera containers https://nf-co.re/docs/developing/containers/seqera-containers
Member
Author
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. I am actually using seqera containers for no gpu situations. https://seqera.io/containers/?packages=conda-forge::llama-cpp-python=0.3.16 I understand I could approach it similarly as here: modules/modules/nf-core/multiqc/meta.yml Line 110 in dd6396b
Until there is a better solution, I could enable the GPU container only when containers and an accelerator (and amd64?) are in use at the same time. |
| Original file line number | Diff line number | Diff line change |
|---|---|---|
| @@ -0,0 +1,5 @@ | ||
| FROM nvidia/cuda:12.4.1-devel-ubuntu22.04 | ||
|
|
||
| RUN apt-get update && apt-get install -y python3 python3-pip | ||
| RUN pip3 install llama-cpp-python \ | ||
toniher marked this conversation as resolved.
Outdated
Show resolved
Hide resolved
|
||
| --extra-index-url https://abetlen.github.io/llama-cpp-python/whl/cu124 | ||
| Original file line number | Diff line number | Diff line change |
|---|---|---|
| @@ -0,0 +1,7 @@ | ||
| --- | ||
| # yaml-language-server: $schema=https://raw.githubusercontent.com/nf-core/modules/master/modules/environment-schema.json | ||
| channels: | ||
| - conda-forge | ||
| - bioconda | ||
| dependencies: | ||
| - conda-forge::llama-cpp-python=0.3.16 |
| Original file line number | Diff line number | Diff line change |
|---|---|---|
| @@ -0,0 +1,35 @@ | ||
| process LLAMACPPPYTHON_RUN { | ||
| tag "${meta.id}" | ||
| label 'process_medium' | ||
| label 'process_gpu' | ||
|
|
||
| conda "${moduleDir}/environment.yml" | ||
| container "${task.ext.use_gpu ? 'quay.io/nf-core/llama-cpp-python:0.1.9' : 'community.wave.seqera.io/library/llama-cpp-python:0.3.16--b351398cd0ea7fc5'}" | ||
toniher marked this conversation as resolved.
Outdated
Show resolved
Hide resolved
|
||
|
|
||
| input: | ||
| tuple val(meta), path(prompt_file), path(gguf_model) | ||
|
|
||
| output: | ||
| tuple val(meta), path("${prefix}.txt"), emit: output | ||
| tuple val("${task.process}"), val("llama-cpp-python"), eval("python3 -c 'import llama_cpp; print(llama_cpp.__version__)'"), topic: versions, emit: versions_llama_cpp_python | ||
|
|
||
| when: | ||
| task.ext.when == null || task.ext.when | ||
|
|
||
| script: | ||
toniher marked this conversation as resolved.
Show resolved
Hide resolved
|
||
| def args = task.ext.args ?: '' | ||
| prefix = task.ext.prefix ?: "${meta.id}" | ||
| """ | ||
| llama-cpp-python.py \ | ||
| --model ${gguf_model} \ | ||
| --messages ${prompt_file} \ | ||
| --output ${prefix}.txt \ | ||
| ${args} | ||
| """ | ||
|
|
||
| stub: | ||
| prefix = task.ext.prefix ?: "${meta.id}" | ||
| """ | ||
| touch ${prefix}.txt | ||
| """ | ||
| } | ||
| Original file line number | Diff line number | Diff line change |
|---|---|---|
| @@ -0,0 +1,72 @@ | ||
| name: llamacpppython_run | ||
| description: Python wrapper for running locally-hosted LLMs with llama.cpp | ||
| keywords: | ||
toniher marked this conversation as resolved.
Show resolved
Hide resolved
|
||
| - ai | ||
toniher marked this conversation as resolved.
Outdated
Show resolved
Hide resolved
|
||
| - inference | ||
| - llama | ||
| - llm | ||
| - local-inference | ||
| - offline-llm | ||
| tools: | ||
| - llama-cpp-python: | ||
| description: "Python wrapper for llama.cpp LLM inference tool" | ||
| homepage: "https://llama-cpp-python.readthedocs.io/en/latest/" | ||
| licence: | ||
| - "MIT" | ||
| identifier: "" | ||
| input: | ||
| - - meta: | ||
| type: map | ||
| description: | | ||
| Groovy Map containing sample information | ||
| e.g. `[ id:'sample1' ]` | ||
| - prompt_file: | ||
| type: file | ||
| description: | | ||
| Prompt file | ||
| Structure: [ val(meta), path(prompt_file) ] | ||
| ontologies: [] | ||
| - gguf_model: | ||
| type: file | ||
| description: | | ||
| GGUF model | ||
| Structure: [ val(meta), path(gguf_model) ] | ||
| ontologies: [] | ||
| output: | ||
| output: | ||
| - - meta: | ||
| type: map | ||
| description: | | ||
| Groovy Map containing sample information | ||
| e.g. `[ id:'sample1' ]` | ||
| - ${prefix}.txt: | ||
| type: file | ||
| description: File with the output of LLM inference request | ||
| ontologies: [] | ||
| versions_llama_cpp_python: | ||
| - - ${task.process}: | ||
| type: string | ||
| description: The name of the process | ||
| - llama-cpp-python: | ||
| type: string | ||
| description: The name of the tool | ||
| - python3 -c 'import llama_cpp; print(llama_cpp.__version__)': | ||
| type: eval | ||
| description: The expression to obtain the version of the tool | ||
| topics: | ||
| versions: | ||
| - - ${task.process}: | ||
| type: string | ||
| description: The name of the process | ||
| - llama-cpp-python: | ||
| type: string | ||
| description: The name of the tool | ||
| - python3 -c 'import llama_cpp; print(llama_cpp.__version__)': | ||
| type: eval | ||
| description: The expression to obtain the version of the tool | ||
| authors: | ||
| - "@toniher" | ||
| - "@lucacozzuto" | ||
| maintainers: | ||
| - "@toniher" | ||
| - "@lucacozzuto" | ||
Uh oh!
There was an error while loading. Please reload this page.