diff --git a/.github/workflows/ci.yml b/.github/workflows/ci.yml index 08e669a..87b7e1c 100644 --- a/.github/workflows/ci.yml +++ b/.github/workflows/ci.yml @@ -21,10 +21,10 @@ jobs: - name: "Build Docker image" run: | docker build . -f containers/Dockerfile \ - -t ghcr.io/edinburgh-genome-foundry/sequeduct_methyl:v0.1.1 \ + -t ghcr.io/edinburgh-genome-foundry/sequeduct_methyl:v0.1.2 \ -t ghcr.io/edinburgh-genome-foundry/sequeduct_methyl:latest - name: "Release Docker image" run: | - docker push ghcr.io/edinburgh-genome-foundry/sequeduct_methyl:v0.1.1 + docker push ghcr.io/edinburgh-genome-foundry/sequeduct_methyl:v0.1.2 docker push ghcr.io/edinburgh-genome-foundry/sequeduct_methyl:latest \ No newline at end of file diff --git a/README.md b/README.md index be0a5c6..26f6458 100644 --- a/README.md +++ b/README.md @@ -39,7 +39,7 @@ dorado download --model dna_r10.4.1_e8.2_400bps_hac@v5.0.0 Pull the Sequeduct Methyl Nextflow pipeline: ```bash -nextflow pull edinburgh-genome-foundry/Sequeduct_Methyl -r v0.1.1 +nextflow pull edinburgh-genome-foundry/Sequeduct_Methyl -r v0.1.2 ``` ### Run @@ -51,7 +51,7 @@ Change to the directory you wish to create your pipeline analysis output in. Cop The following should be run on the command line: ```bash -nextflow run edinburgh-genome-foundry/Sequeduct_Methyl -r v0.1.1 -entry analysis \ +nextflow run edinburgh-genome-foundry/Sequeduct_Methyl -r v0.1.2 -entry analysis \ --pod5_dir='path/to/pod5_pass' \ --genbank_dir='path/to/genbank_ref/dir' \ --sample_sheet='path/to/sample_sheet.csv' \ @@ -97,7 +97,7 @@ docker pull ghcr.io/edinburgh-genome-foundry/sequeduct_methyl:latest Subsequently, the command below is run to convert the FAST5 to POD5. Insert the path from your current directory to the sample sheet using `--sample_sheet` and the full path to the main directory containing subdirectories for each sample with FAST5 files using `--fast5_dir`. ```bash -nextflow run edinburgh-genome-foundry/Sequeduct_Methyl -r v0.1.1 -entry converter \ +nextflow run edinburgh-genome-foundry/Sequeduct_Methyl -r v0.1.2 -entry converter \ --sample_sheet 'path/to/sample_sheet.csv' \ --fast5_dir '/full/path/to/fast5_pass' \ -with-docker converter_docker diff --git a/conf/base.config b/conf/base.config index 09d7ddc..2ed2342 100644 --- a/conf/base.config +++ b/conf/base.config @@ -2,7 +2,7 @@ manifest { name = 'Sequeduct Methyl' description = 'Methylation sequencing analysis pipeline (aqueduct) for validating plasmids nucleotide modifications, using long reads.' - version = '0.1.1' + version = '0.1.2' homePage = 'https://github.com/Edinburgh-Genome-Foundry/Sequeduct_Methyl.git' author = 'Jennifer Claire Muscat' nextflowVersion = '>=23.10.1' @@ -40,7 +40,7 @@ profiles { charliecloud.enabled = false // specify the container to be used - process.container = "ghcr.io/edinburgh-genome-foundry/sequeduct_methyl:v0.1.1" + process.container = "ghcr.io/edinburgh-genome-foundry/sequeduct_methyl:v0.1.2" } singularity { @@ -52,7 +52,7 @@ profiles { charliecloud.enabled = false // specify the container to be used - process.container = "ghcr.io/edinburgh-genome-foundry/sequeduct_methyl:v0.1.1" + process.container = "ghcr.io/edinburgh-genome-foundry/sequeduct_methyl:v0.1.2" } // Son of Grid Engine configuration diff --git a/demo/README.md b/demo/README.md index d79e373..6167014 100644 --- a/demo/README.md +++ b/demo/README.md @@ -9,7 +9,7 @@ All extra files required for a demonstration run of Sequeduct Methyl are availab Sequeduct Methyl requires four input files in total. The `pod5_dir` and GenBank-format reference file from the [demo](https://github.com/Edinburgh-Genome-Foundry/Sequeduct_Methyl/tree/main/demo) directory should be downloaded in a directory you wish to run the pipeline from. Additionally, download the `sample_sheet.csv` and `param_sheet.csv` from the [sheets](https://github.com/Edinburgh-Genome-Foundry/Sequeduct_Methyl/tree/main/demo/sheets) directory, and then the following can be run. Note that `--model_path` requires the full path to the basecalling model `dna_r10.4.1_e8.2_400bps_hac@v5.0.0` by [Dorado](https://github.com/nanoporetech/dorado). ```bash -nextflow run edinburgh-genome-foundry/Sequeduct_Methyl -r v0.1.1 -entry analysis \ +nextflow run edinburgh-genome-foundry/Sequeduct_Methyl -r v0.1.2 -entry analysis \ --pod5_dir='./pod5_pass' \ --genbank_dir='./genbank' \ --sample_sheet='./sheets/sample_sheet.csv' \ @@ -63,7 +63,7 @@ The final page contains an Appendix that further explains the structure of the r ## Interpreting Pipeline Results * Inspect both the bedMethyl file saved for each barcode and sample, for example `barcode1_EGF_met_1.bed` as well as the final PDF report `EpiJinn_report.pdf`. -* Review the main components constituting the reference plasmid from the 'plot of the sequence' per sample in the PDF report. +* Review the main components constituting the reference plasmid from the 'plot of the sequence' per sample in the PDF report and compare this to the plasmid map of the reference GenBank-format file on a sequence editor. * Observe the plots illustrating the methylated positions in the plasmid sequence per barcode. Each plot includes all methylation pattern of the specified methylase found in the plasmid. Patterns continaing a methylated base are shown in red, whilst bases with undetermined modification statuses are shown in yellow. Arrows refer to the strand the modification is present on. * Locate the methylated positions per barcode shown in red (with status '1') and the undetermined positions in yellow (with status 'U'). Patterns labelled as unmethylated in grey are marked with status '0'. Match the location of the methylated positions stated in the bedMethyl tables to the reference sequence plot to identify the regions of the plasmid that the modifications occur in, taking the strand into consideration. * Take note of the coverage for the positions marked as methylated (in red) in the PDF report. Positions with a methylated status that contain a low coverage may not reflect a genuine modified position. Therefore, positions with coverages below a chosen threshold may excluded from being classified as methylated due to this uncertainty.