diff --git a/pipelines/nf-atacseq/assets/email_template.html b/pipelines/nf-atacseq/assets/email_template.html
new file mode 100644
index 0000000..161c1e4
--- /dev/null
+++ b/pipelines/nf-atacseq/assets/email_template.html
@@ -0,0 +1,48 @@
+
+
+
+
+

+
+
${workflow.manifest.name} v${workflow.manifest.version}
+
Run Name: $runName
+
+<% if (!success) { %>
+
+
⚠️ ${workflow.manifest.name} execution completed unsuccessfully!
+
The exit status of the task that caused the workflow execution to fail was: $exitStatus.
+
The full error message was:
+
${errorReport}
+
+<% } else { %>
+
+${workflow.manifest.name} execution completed successfully!
+
+<% } %>
+
+
The workflow was completed at $dateComplete (duration: $duration)
+
The command used to launch the workflow was as follows:
+
$commandLine
+
+
Pipeline Configuration:
+
+| Nextflow Version | $nextflowVersion |
+| Run Name | $runName |
+| Session ID | $sessionId |
+<% if (summary.size() > 0) { %>
+<% for (e in summary) { %>| ${e.key} | ${e.value} |
+<% } %>
+<% } %>
+
+
+
--- ${workflow.manifest.name}
+
+
+
+
diff --git a/pipelines/nf-atacseq/assets/nf-core-pipeline_logo_light.png b/pipelines/nf-atacseq/assets/nf-core-pipeline_logo_light.png
new file mode 100644
index 0000000..476ce66
Binary files /dev/null and b/pipelines/nf-atacseq/assets/nf-core-pipeline_logo_light.png differ
diff --git a/pipelines/nf-atacseq/environment.yml b/pipelines/nf-atacseq/environment.yml
new file mode 100644
index 0000000..8ba8147
--- /dev/null
+++ b/pipelines/nf-atacseq/environment.yml
@@ -0,0 +1,23 @@
+---
+# yaml-language-server: $schema=https://raw.githubusercontent.com/nf-core/modules/master/modules/environment-schema.json
+# Conda environment for nf-atacseq local Python/WASP2 modules
+# (wasp2_make_reads, wasp2_filter_remapped, wasp2_count_variants, wasp2_find_imbalance)
+channels:
+ - conda-forge
+ - bioconda
+dependencies:
+ - python>=3.10
+ - numpy>=1.21,<2.0
+ - pandas>=2.0
+ - polars>=0.19
+ - scipy>=1.10
+ - pysam
+ - pybedtools
+ - samtools
+ - bcftools
+ - bedtools
+ - typer
+ - rich
+ - pip
+ - pip:
+ - wasp2==1.2.1
diff --git a/pipelines/nf-atacseq/modules.json b/pipelines/nf-atacseq/modules.json
index 0d78430..bb4626c 100644
--- a/pipelines/nf-atacseq/modules.json
+++ b/pipelines/nf-atacseq/modules.json
@@ -1,5 +1,5 @@
{
"name": "wasp2/nf-atacseq",
- "homePage": "",
+ "homePage": "https://github.com/mcvickerlab/WASP2",
"repos": {}
}
diff --git a/pipelines/nf-atacseq/nextflow.config b/pipelines/nf-atacseq/nextflow.config
index e844cbf..8e709e1 100644
--- a/pipelines/nf-atacseq/nextflow.config
+++ b/pipelines/nf-atacseq/nextflow.config
@@ -15,6 +15,8 @@ plugins {
manifest {
name = 'wasp2/nf-atacseq'
author = 'WASP2 Team'
+ homePage = 'https://github.com/mcvickerlab/WASP2'
+ doi = 'https://doi.org/10.1038/nmeth.3582'
description = 'ATAC-seq Allelic Imbalance Pipeline with WASP2 mapping bias correction'
mainScript = 'main.nf'
nextflowVersion = '!>=23.04.0'
@@ -73,6 +75,7 @@ params {
help = false
version = false
tracedir = "${params.outdir}/pipeline_info"
+ validate_params = true
}
// Load configuration files
@@ -97,7 +100,6 @@ profiles {
conda.enabled = true
docker.enabled = false
singularity.enabled = false
- process.conda = "${projectDir}/../../environment.yml"
}
docker {
docker.enabled = true
@@ -153,15 +155,15 @@ profiles {
def trace_timestamp = new java.util.Date().format('yyyy-MM-dd_HH-mm-ss')
timeline {
enabled = true
- file = "${params.tracedir}/execution_timeline_${trace_timestamp}.html"
+ file = "${params.tracedir}/timeline_${trace_timestamp}.html"
}
report {
enabled = true
- file = "${params.tracedir}/execution_report_${trace_timestamp}.html"
+ file = "${params.tracedir}/report_${trace_timestamp}.html"
}
trace {
enabled = true
- file = "${params.tracedir}/execution_trace_${trace_timestamp}.txt"
+ file = "${params.tracedir}/trace_${trace_timestamp}.txt"
}
dag {
enabled = true
@@ -184,7 +186,7 @@ process {
withName: 'WASP2_MAKE_READS|WASP2_FILTER_REMAPPED|WASP2_COUNT_VARIANTS|WASP2_FIND_IMBALANCE' {
container = wasp2_container
}
- withName: 'BWA_MEM' {
+ withName: 'BWA_INDEX|BWA_MEM' {
container = bwa_samtools_container
}
withName: 'SAMTOOLS_INDEX|SAMTOOLS_FAIDX|SAMTOOLS_STATS|SAMTOOLS_FLAGSTAT|SAMTOOLS_IDXSTATS|SAMTOOLS_SORT' {
@@ -201,27 +203,24 @@ def check_max(obj, type) {
try {
if (obj.compareTo(params.max_memory as nextflow.util.MemoryUnit) == 1)
return params.max_memory as nextflow.util.MemoryUnit
- else
- return obj
- } catch (all) {
- println "WARNING: Invalid max_memory '${params.max_memory}', using default"
+ else return obj
+ } catch (Exception e) {
+ log.warn "Invalid memory config (${obj}, max=${params.max_memory}): ${e.message}. Using ${obj}"
return obj
}
} else if (type == 'time') {
try {
if (obj.compareTo(params.max_time as nextflow.util.Duration) == 1)
return params.max_time as nextflow.util.Duration
- else
- return obj
- } catch (all) {
- println "WARNING: Invalid max_time '${params.max_time}', using default"
+ else return obj
+ } catch (Exception e) {
+ log.warn "Invalid time config (${obj}, max=${params.max_time}): ${e.message}. Using ${obj}"
return obj
}
} else if (type == 'cpus') {
- try {
- return Math.min(obj, params.max_cpus as int)
- } catch (all) {
- println "WARNING: Invalid max_cpus '${params.max_cpus}', using default"
+ try { return Math.min(obj, params.max_cpus as int) }
+ catch (Exception e) {
+ log.warn "Invalid CPU config (${obj}, max=${params.max_cpus}): ${e.message}. Using ${obj}"
return obj
}
}
diff --git a/pipelines/nf-atacseq/tests/data/annotation.gtf b/pipelines/nf-atacseq/tests/data/annotation.gtf
deleted file mode 120000
index 993462d..0000000
--- a/pipelines/nf-atacseq/tests/data/annotation.gtf
+++ /dev/null
@@ -1 +0,0 @@
-../../../../tests/shared_data/annotation.gtf
\ No newline at end of file
diff --git a/pipelines/nf-atacseq/tests/data/bwa_index/chr_test.fa b/pipelines/nf-atacseq/tests/data/bwa_index/chr_test.fa
index 923c055..182b3f7 100644
--- a/pipelines/nf-atacseq/tests/data/bwa_index/chr_test.fa
+++ b/pipelines/nf-atacseq/tests/data/bwa_index/chr_test.fa
@@ -1,331 +1,335 @@
>chr_test
-ATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGC
-ATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGC
-ATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGC
-ATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGC
-ATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGC
-ATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGC
-ATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGC
-ATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGC
-AAACCCGGGTTTAAACCCGGGTTTAAACCCGGGTTTAAACCCGGGTTTAAACCCGGGTTT
-AAACCCGGGTTTAAACCCGGGTTTAAACCCGGGTTTAAACCCGGGTTTAAACCCGGGTTT
-AAACCCGGGTTTAAACCCGGGTTTAAACCCGGGTTTAAACCCGGGTTTAAACCCGGGTTT
-AAACCCGGGTTTAAACCCGGGTTTAAACCCGGGTTTAAACCCGGGTTTAAACCCGGGTTT
-AAACCCGGGTTTAAACCCGGGTTTAAACCCGGGTTTAAACCCGGGTTTAAACCCGGGTTT
-AAACCCGGGTTTAAACCCGGGTTTAAACCCGGGTTTAAACCCGGGTTTAAACCCGGGTTT
-AAACCCGGGTTTAAACCCGGGTTTAAACCCGGGTTTAAACCCGGGTTTAAACCCGGGTTT
-AAACCCGGGTTTAAACCCGGGTTTAAACCCGGGTTTAAACCCGGGTTTAAACCCGGGTTT
-AAACCCGGGTTTAAACCCGGGTTTAAACCCGGGTTTAAACCCGGGTTTAAACCCGGGTTT
-CGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGAT
-CGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGAT
-CGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGAT
-CGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGAT
-CGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGAT
-CGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGAT
-CGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGAT
-CGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGAT
-TGACTGACTGACTGACTGACTGACTGACTGACTGACTGACTGACTGACTGACTGACTGAC
-TGACTGACTGACTGACTGACTGACTGACTGACTGACTGACTGACTGACTGACTGACTGAC
-TGACTGACTGACTGACTGACTGACTGACTGACTGACTGACTGACTGACTGACTGACTGAC
-TGACTGACTGACTGACTGACTGACTGACTGACTGACTGACTGACTGACTGACTGACTGAC
-TGACTGACTGACTGACTGACTGACTGACTGACTGACTGACTGACTGACTGACTGACTGAC
-TGACTGACTGACTGACTGACTGACTGACTGACTGACTGACTGACTGACTGACTGACTGAC
-TGACTGACTGACTGACTGACTGACTGACTGACTGACTGACTGACTGACTGACTGACTGAC
-TGACTGACTGACTGACTGACTGACTGACTGACTGACTGACTGACTGACTGACTGACTGAC
-TGACTGACTGACTGACTGACTGACTGACTGACTGACTGACTGACTGACTGACTGACTGAC
-ACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGT
-ACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGT
-ACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGT
-ACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGT
-ACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGT
-ACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGT
-ACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGT
-ACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGT
-GTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCA
-GTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCA
-GTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCA
-GTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCA
-GTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCA
-GTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCA
-GTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCA
-GTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCA
-GTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCA
-GATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATC
-GATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATC
-GATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATC
-GATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATC
-GATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATC
-GATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATC
-GATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATC
-GATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATC
-GATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATC
-TCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAG
-TCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAG
-TCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAG
-TCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAG
-TCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAG
-TCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAG
-TCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAG
-TCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAG
-TCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAG
-AGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTC
-AGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTC
-AGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTC
-AGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTC
-AGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTC
-AGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTC
-AGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTC
-AGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTC
-AGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTCAGTC
-CATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATG
-CATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATG
-CATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATG
-CATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATG
-CATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATG
-CATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATG
-CATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATG
-CATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATG
-CATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATG
-TACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACG
-TACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACG
-TACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACG
-TACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACG
-TACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACG
-TACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACG
-TACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACG
-TACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACG
-TACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACG
-GCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCAT
-GCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCAT
-GCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCAT
-GCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCAT
-GCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCAT
-GCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCAT
-GCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCAT
-GCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCAT
-GCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCAT
-ATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGC
-ATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGC
-ATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGC
-ATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGC
-ATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGC
-ATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGC
-ATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGC
-ATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGC
-ATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGC
-CGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGAT
-CGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGAT
-CGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGAT
-CGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGAT
-CGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGAT
-CGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGAT
-CGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGAT
-CGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGAT
-CGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGAT
-GTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTAC
-GTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTAC
-GTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTAC
-GTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTAC
-GTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTAC
-GTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTAC
-GTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTAC
-GTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTAC
-GTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTAC
-TACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACG
-TACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACG
-TACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACG
-TACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACG
-TACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACG
-TACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACG
-TACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACG
-TACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACG
-TACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACG
-ACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGT
-ACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGT
-ACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGT
-ACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGT
-ACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGT
-ACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGT
-ACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGT
-ACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGT
-ACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGT
-GATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATC
-GATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATC
-GATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATC
-GATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATC
-GATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATC
-GATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATC
-GATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATC
-GATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATC
-GATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATC
-TCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGA
-TCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGA
-TCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGA
-TCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGA
-TCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGA
-TCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGA
-TCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGA
-TCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGA
-TCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGA
-ATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGC
-ATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGC
-ATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGC
-ATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGC
-ATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGC
-ATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGC
-ATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGC
-ATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGC
-ATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGC
-CGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGAT
-CGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGAT
-CGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGAT
-CGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGAT
-CGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGAT
-CGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGAT
-CGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGAT
-CGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGAT
-CGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGAT
-GTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTAC
-GTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTAC
-GTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTAC
-GTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTAC
-GTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTAC
-GTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTAC
-GTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTAC
-GTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTAC
-GTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTAC
-ACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGT
-ACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGT
-ACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGT
-ACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGT
-ACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGT
-ACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGT
-ACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGT
-ACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGT
-ACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGT
-TCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGA
-TCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGA
-TCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGA
-TCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGA
-TCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGA
-TCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGA
-TCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGA
-TCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGA
-TCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGA
-GATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATC
-GATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATC
-GATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATC
-GATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATC
-GATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATC
-GATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATC
-GATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATC
-GATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATC
-GATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATC
-CGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGAT
-CGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGAT
-CGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGAT
-CGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGAT
-CGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGAT
-CGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGAT
-CGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGAT
-CGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGAT
-CGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGAT
-GTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTAC
-GTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTAC
-GTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTAC
-GTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTAC
-GTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTAC
-GTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTAC
-GTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTAC
-GTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTAC
-GTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTAC
-ATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGC
-ATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGC
-ATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGC
-ATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGC
-ATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGC
-ATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGC
-ATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGC
-ATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGC
-ATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGC
-CATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATG
-CATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATG
-CATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATG
-CATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATG
-CATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATG
-CATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATG
-CATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATG
-CATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATG
-CATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATG
-TACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACG
-TACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACG
-TACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACG
-TACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACG
-TACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACG
-TACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACG
-TACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACG
-TACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACG
-TACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACG
-ATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGC
-ATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGC
-ATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGC
-ATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGC
-ATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGC
-ATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGC
-ATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGC
-ATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGC
-ATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGCATGC
-GATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATC
-GATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATC
-GATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATC
-GATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATC
-GATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATC
-GATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATC
-GATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATC
-GATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATC
-GATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATC
-CGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGAT
-CGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGAT
-CGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGAT
-CGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGAT
-CGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGAT
-CGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGAT
-CGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGAT
-CGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGAT
-CGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGAT
-TCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGA
-TCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGA
-TCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGA
-TCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGA
-TCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGA
-TCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGA
-TCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGA
-TCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGA
-TCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGATCGA
-ACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGT
-ACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGT
-ACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGT
-ACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGT
-ACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGT
-ACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGT
-ACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGT
-ACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGT
-ACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGT
-GTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTAC
-GTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTAC
-GTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTAC
-GTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTAC
-GTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTAC
-GTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTAC
-GTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTAC
-GTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTAC
-GTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTAC
-TACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACG
-TACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACG
-TACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACG
-TACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACG
-TACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACG
-TACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACG
-TACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACG
-TACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACG
-TACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACGTACG
+GAAAGGCATAATAAGTAGCACGTACTAACGCGTCTTCGCTGAAAATAGTTAACGGAGATC
+GTGCGAATAACCTGTCTAATAGCTACTAAAGCTATCTCCAGGTAGATTCCATACCTGGAG
+TGTATACCCTACCATAGGATTACTATGATCGTTAATGAAAGACCAAGAACTTGCAATTTG
+GCATTCAATTAACTCTACCCCATATATCAGTTCCTGATCTTGAGTCACAAGGAACAGGTG
+TCAGATGTTGATCCAAACCCTACGGCGACTGCAAATAGGAGATCCATAAGGAGTTAACCT
+CGAATCCCCAAAGCTGACCCCAGTCCCCAGACCACTTCAAATCCAGTCTCACACAATGTG
+TTTAGACTGGGTAGTTCGTTTTATCGCGTTAATTGTTATCCAATGTCGGAAAATCATGAG
+TAGAGGATACTAACTCGCGCCGGTCTCGTAAGGTGAAAATTAAGGATTTATCGGCGTATG
+CCTGTGAATATGTATAGATTAGATATATGTGCAAATCTGGGGCAAAAGTAGGAGGACCAA
+TGCTGAGGAGCGACGTTTTCCACGCGTGCACTTTGACCACATGTACAACTCGAACAGTGG
+GTCAAGTGTTTGTGAAAAGGAATGCTAAAATTACTGACTCTTTAACTCTAGAATTCAGGC
+ATTTCCTGGGCAAGAAAATGTAGGTGCGGGCTTGCCAATGTAAGGCTTAATTAACCTCCG
+AAGTGCAGGTATTGCTGACCTTTTCTTCGTTATGGGATCTGACGAATTACCTACTGTACC
+ATTCTCCACTCTCATGCTATTTTAAGTAGAGGCTGCCTATGCCTTTGTGATCTGGCCCTT
+GGCAAGCCGTAGCTGCACTTATTCAACGACATAAACCGATTGGTACATTATTCTCGATGG
+AGTCACGTGGGGCGCGTTTGATGAATCTCCACTCGTACACCGCCCTCATTGGGCCAAACT
+CAACCTTACTTACATGGCTGATATTCATTCCAGTCTTAACTGGGAGAATAGAACTACACA
+AAAGAAGATAAGTGTGTATCAGCTTCATTGTCAAGAAGTTCTTGAGCGGGATATTTATGT
+ACACAAGCTGTTATGGCGCGTTAGAACTGTCCCCGGACCAAGTTACTTAGAGATTTGGTA
+AAGGAGTTAGATAGTGATGATAAATAGATGTCCACAACCTTGTAATCGCCACAGTTTTAT
+ATCTGCCAAAGGGAGTGGTCTGGCGAATTAATTTACACCGTTTCCTCGTTAAACTGTAAT
+TTATATTGGGAAGAGGCCTGATCGTGCTTCCGCGGTGTTTAACTAAACAGCCATGATACG
+CATTGATAGTTTCTCTCCTATTCCCAAGCTACCAGACATCATTAATACTACCGCAACGAG
+TAAACTGTAATATCTACGATAATGATGACATTCTTTGCAAGTGGGGTATCAGTGGCAGTT
+AAACTCTAGATGCTATCGCTCTTCTCGAGCTTAGTGTGTACTCACCAGTCGCAGGAAGTT
+TGGCTGTTTGAAGTTTAATCACTACTCTAGCTTATCCGCGCTAAACATTCTGATCGTGCA
+CGTGTCGGACTCAAAATGTCCCAGTATTTACAGGGCTCAAGTGGTGTGACTCGTAATTAG
+TGGCCATTTTAAATTGACATTTGTTTTACTCATATCGTTCTCGGTTTATATGACGACTCT
+CGATTAATTTGTTGACGTTCTGTCTGCGCGGATCGGTGGAGGCAGACAATAGTGCCGAAA
+TGTTACTTGGGGAATACTAAGTTCCAAGTCCCCTAGTTATATCGAGGAGTGATGAGATCT
+CCTACTGCATTGCCACACCTTCCCCATACACTTCCTAAATAAGCTGACCCTAGAATAAAG
+CTGAGGAATTTCGTACTGAAAGGTTTTGAAGCATGATATTTATTAAGATCTTTATCGTCG
+TATACCACATGGCGTCTCCTGGTGTATTGAAATGTTCATACGACTGCAAAAGGAGTAACA
+TACGTGGTTAGATACCCGTTCCGGTTATGTCTGCCTCTAAAGCCAGAAGGCAGGTTCTCA
+CCACTAGACTGTTTATTACTCCTTTAAACTTATTCTGGACCGTACAGTCTGAACCGGTCA
+GATTGGGTTATATACACGCCAAAATCATTTTCAGCGCGATTAAATTGTCATAACCTAACC
+TACTCGGGTAAACTCTGACGTCATCTGCTGAACTTCTGGAGCGAAGGGTAATTAAATTTA
+TAGTTTTACCCTATATTATTTAAAGGAATCTGCTTCCCATCATCCTGTTATCTATGTGTC
+TGTTGCCTTGAGGGACTTTCGTCTCTGAGGTGACGTGCTAATTGTTTGGTTAATCACATT
+ATTTGTTCACGGACAAATCATAGTAGAGTGAGCAACATTACTGGGGTCGCGTGAAATAGT
+TATAGGGCTTATTATAACCTTGTCTAAGTATATGGTAAGCTCAGTCACGTCTTCTCGACG
+TGGAAAATATTGAACCGACGCCCACAGCGGTTATTGCATACTCTAGGGTGTATATAACTT
+TTGAAGTACTACAGAGACAGATCATTGAGGATAAGAGCCTAATGATCAGGACATAGTGGA
+TGCAAGGTCTAAATGGGGCGTTTGTACCTATGTCCCACTTGGCGAAAACTGTTGATGATT
+ACTTGCGAGGCAATTGTGGAGGACTGGAAGACGACAAGTATTTTAATGATACATTACCTC
+GTTTGAATTCACCCATACTTAATTGTGTGACGAATATCCCAGCGATATACGACCTGTCAA
+ACATTCAATCGGTAAAGGAATTTCATAAAGCGACTAATTGACATTGATCAACCACTGGGA
+CAACTACCTATATCTAGAAAACAGATTTAAAACTGCCCGTTTCTTATACGACTGCCAGAC
+CACACCTCCAGCGCAGCTTACCTTTAAATACAAGCCTAGCGCCCTCTATAACCCGACGCG
+AGATGAGCCTCCAGCCATCAGACACAGGCTAAAATTGCCTTTATCGGAACTTCAATGTCA
+GGTACACAAAAGGGAAAATCATTTGGAAATACTTTGATACTTATAAAGGATTCGTCCTTC
+TCTACGTCCGGAGACCCATCTCGCACCATTTATCGGTTTAGGCCTAATTTTGAAAGGACT
+AGCCACTATGACACTCATGAACGGCCTATTACCAACCATCGACTGAATGACGTACGGATA
+TCCGGATAGGACGGAACTCGTTTATGCTATGCTGGTAACGCAGCTAGCCCGGGGCATTAG
+TAGATGCGTCCCAAAACGAGTATGTGTATCTCGCACTCTTACAATTCTTGGTGAGAAGAG
+TGAGGTCTAATATCAGGAGTATGACTTGGTCCTCTACCTAGAGGATGACATACGGAGTTT
+TAGGTGGAGACAGAAAATTAGTATACTAGCCGAATGAAACTTAAATCTGAGACGATTGCA
+CATCATCCGCAGACATGCGATTAGCCACATAATGGGTTCGTTGAGATGTCTCAGACCCAT
+ACAAGTATCTCTATGATTAAGGTTAGCTAATTGTGGAGATCCTTGAAAGGAGACTTGGAT
+CCGGTGCATTACCTTCATGATGCTTCCGACCTATGGTGCGCGAGTTGCGCTGTATTTGTG
+CACCTAAGAGAAACGTGACACGCGTAGCAGCTCCTTAAGGCCCGGGTGGCTAGAATTTTA
+GATGAATACGGTTTGTAAATTTAAATTAGTCCCAGTCGGCGTCCTTACCTCTACATCACT
+AAGGCTATGCGGCGATTAACTTAATGTAGTGGGGACAGTAGTTGTTATCTCAGCCGTCTT
+AAGTCTGCTTGTAACAACCCCTTTAAGTTAGAGCTTGTGTTTTAAAGTCAGCTTTTAGCC
+ATACAAATAGTGCTTCTGTAGGTTTTGCCGATTACGCGTTATATAACTTTACTGTCCATA
+GTGCTTCTTCTTGTAAAGAATGAACGTTAACAATAGATAAACGTAGGAATCCACGCCAGA
+GTTGATAACTTAATGAGTATAGCCGGTTATACGTGGGGAATACACTAGGTAAGGTTAGAC
+TTAGGTGTTTATTGGCGGTGAATTTGGACAAACTAAAATCGTGGCCGTAGCAAGTAAAAT
+CGTTGTGAAACCTCAGACTATAATCCCCTGCTGGCTTGAAAGCGATCTACAAGCACTTCA
+CGCTAGCAAAGAACGGGGTATGTCCCTCCAATACTTTTGACGTGAAGTGATATGTTAGTC
+AAATAAAATTACACATCCTGGTTTTGACTGTTTTCAAACCATGAGTGTGCTAGAACTGTC
+AAATTAGATCTGCTAAGGCGAAAACTATGAAAGCTAAGACAGCTTCTATCGAGGGTTGTT
+TCTTATACCTTACCTATTAATTTTAGTTATAGCCGAGCTCAAGGAGAAATAAAGGAATTT
+CCTCTCCAGATACCCAGAGTGATGTCTGTTGACTAGACCAAGTAAAGAAGTGTAAAGCCG
+AGGCAACGGCTAGTACTTTGAATGACCTAATATAGTAACGAGGTTTTGTGATACACATAT
+CGTGATGACATCACATCTTGCAAATCCAGTATAGAGTAGTTGCAATTACTTTCTTGTGGT
+AGCACTTGCGTCTTACACGATTCAATATGACATCGGCACGTCGTGTAAGTCTCCAGGAGT
+TATATAAGTTGTAATAATATATGAATTGAGGAAGTCAGTTTGATCGCTAACATGCAACCC
+CAGATAATATATGAGAGGAAAGGAGATACGCACGATCATCTATTCAATTTATTGACTCGC
+CCATAACGATCGGAAACCTTAATCCTGTACCACCTTCATCGGCTTTCCCAGAAGGATAAG
+TGTTGGTCTAAAGAATGCGACCCTTTATAGTTGGGTCGTTCACTTGTTGATTTCTTGATA
+CTGAGCGATTAGGATAGCCGAATTTTCTCTTGCTGACAGTTGTGAAAGATCTACAGTTAG
+ATGTCAAGACGCTCATAGGGGATTCATTTATTTAGATTGGAGGCTGCCAGTTCTATTGTA
+GGCAAGACCCTTTGAAACTTTAGTGGAATTGCCGTGCTTGTGCTGTTAGCCTCAACGCTT
+GCGGTATTATCATAGGCTATTACGTGACCCGAGTGTACGGATATGTTTCTAATTAAAAGT
+ATTAGAAAGTTATGAATAGGCGGTCGGTCGTACCTTGGTAACGCTGGGCTATTTAGGAAC
+CTGCTTTGTCTTCGGTGTAGACTTGTTCACAACGTTGACCCGAAATTTAGTTCTCTCTAA
+CTATTTAGCTCCAGTTTTGTATCCACGAAAGTTCAGTTGGTATTTTAGTCATTTTCTGAT
+GAGCCGTACATGCAGCTATGTTTGTCCAACGGTATAACCGAATCAAACAAAGATCAGTCC
+TAACATCGATGAGTGGAATTGGTTGTACACTGCGACGCTCCTAAGTGGGGATGATGCAAA
+TAAAACGCCGGACAGCTCCGATCGCATCGTAAGTTACATTCGATAGAGCGAATATCAGCG
+AGCTTCTTCGGTACCTTCTGTGCATCATGGAATAGCGTAGGAAGGTATTTCTCAAGAACG
+TGCATCAAGTCAGAAATCTAGCATCACTCCGTCTACCGGTAATGTTCAACGGATAAAGCT
+CGGAGTTCGAATCGGTAAATATGTAGGAACGCTAGAGATTCGAGCAGTACGGTAGTGTAG
+CTATTCACTTAGGCAAGAACTATCGGGGACCACTCGCAGGATTCGATACATGATTCCTAT
+AGCATGATTGCGATGCTGTTGCACTATACTCGACGACGCATGTATAGACAATCGCAGATA
+GAATTTAGGTTGCCCCACTACACAAGTCTGTCTATTGTACACGTTGTGGCTTAGAATCGA
+TTACGACCGGAAATAAATATTTTATCTTATTAGCTGTACCTATCTGGCATTTCTAAGGAC
+AATTGATATGCCTACTTATCCAGTCCACCTCAGAATCCACGATCTTGGAATTACCTTTAA
+ACCTGCTTGAAACAGGTCGTGATTCAATCAAATCTATCTGAAGTCCGTGGAGCATTTTCA
+AAACGCTTTGATACCTTTCCGGTGACACAAAAGGAGGAACTAAAAGGGCACATACCCTAT
+GATATAAAACTCAATGTGTCATTAAACAAAGGTATAAGTCTTTCAACTGACTATGAATGA
+CCACTGCACGAGGAGGTTGTTAGAATGAAAAGCTGAGAAGGCAGTATCTCATCTTTTATC
+TGTAGTAGGGTTCTTTCGTCTAACTGACTATTTGAGGCATTATTCTCAGGCTTTCAGTTG
+TGTTTCGCTAACTAGACATACTACGTCTTATGTGAAGCTACGTCTGGTTGTTAAGTTTCA
+ATCGAGTAAACTTTGAAAACGACCTACAGCCTTGACGAAGCTCCCACAACTGTGATAACT
+AGTTCTTGCCCTGCACGCGCGGATTCTCACCTCTCAACAACCGCGTACCCTTCGCCCGTT
+GCGTAAGGCATGTAATCCGCGCTTGAGCCATACCCACCGGCCAGATTAATCAGTCTGAGA
+CGATACGCAGTTATAGCTGTAATGGGGAAATACCCCGGAAGTTTCTGATCCATTAAAACC
+GCACGGATCTCGACGCAAAACTCCATGTTCCAACAATACGGCTTTAGGCAGGTGCCAACG
+TCGACGCTGGCTAAGTAACTTACCACAGAGGATTCTGAGCTTCTTTGCGTTATTAGATGT
+TTCTAACCTTAAAATAGTAAATAGAATACTGTGGACCAAGGCATAAATGCCGTGCTGGTT
+AAAACCAGGTGCATTTAAAGCTCGATCAAGGCCGGTTTTGGGCTGTTTACTTTCTGAAAT
+AACTGCGATGCCGGCCCGAGGAAGATCTAAACTACCAATGAAATTACAAGTGGCTTCAAG
+GCCAAGCCATTTGAGTACTTGACTTATGTGAGTACTTTCCTAAACCATCAAGGGCAGGGT
+TTGTTGCAATCGTATGGGCGTATATGGACAATTGAACGAGGCAATGTAGATGTCCCTCGT
+GTAGGGGTATGCTAGCAACTTTTGTTATTTCTCCAAGAGCAATGCTCGTATAATCTTCAG
+ACCACTATCTTTCGTGGGTTTTCTCGTATTCCGGCGTCGTATAGTATATCACAAGAGCTC
+GTACATTCTAAAATATTAGTAATTTTCAAGGTGTAATTTTACACGATGTTAGACTCGTTC
+TATCACACTGCTTGGTAGTTTAATATGCTGTAGTACTTGAGGATCGTCGGTGGAACGGTC
+CTAGGATCTAAACTAGTGATTACGAACTCTTTGTGTAAAATATGAGCGTATTCGCACTCA
+GTTGCAATTAAATAGCTAAATGATCGGTAAATATCCGGGGTAAATCAACTTGAGTTTAGA
+GGATCCGTCGTTAAGAGATGATGTACATTCGTCGATTTAGGATCCTAACGTGGCGTTCGT
+ATGAAAAGAGCTGAACTAAATAGGAAAACGTTAACCAGTGACTACGCCCCAACCATTGCA
+AGATGTACCCCAATGATGGTTTTGGTATCGAAACTTCTCTTAATTGTGTTTCTTAAGTAC
+TGGCAAAATTCGAGCCGGCATCGTTTGTTGATAGTTGGGTCTAGGATTTTACACCTTGTG
+TTAGCACTGGGCCATTAATTCAATAGTAACAAGAATACTAATTACCAATGTGCGTGAAAA
+TCTCCTTGACTGGTGCAACGTCATTCACAGTCGGATCTCAAGTTATTAGGTGCTAACTGT
+ATACACCAAATTTAGGATAAGAGCCGGCTTAAGGCTAATCTAGACCCAATATTAATCAAT
+ATTTTACGTAATGCATCCACGCGGCGTGCTCTTGGTGAGCAGCTGGGATTAAACGCGTAG
+GTCGAACTATCGAGGGTTTACAAGAAAGCCAAGTGAAAATGAGACTATTGGCCATCGCGA
+GATTTGAATAAATGTCCCTTGGTACTTATACGTTGGGCGAACGGGGATGAGCCAGGCTGC
+TATCATCGTTTCGAGGTAGCTTCCAAGTGGATGAACTCAAAGACTGGCATTATGTGAAGA
+GCATAGCGCTTTTCCCCGTATTATGGCAGCAGCTGGTTACCCATACTTGTGATCCCCGTA
+ATTCTACTGTCATAGAAGGATGACCGAATCAATGAGCCGGGTGGTGTCCAAAAGCGATCC
+TAATCCTTGCTGATTTACCTTGAGCGGTCACGTCTGTCTCAGCGACATTCGCCTTGCGTT
+AGACTAGGCCGTAAGTAAGGAGTGCACTCCACAACGGCGTAATGCGTGCGGCGAGTAATG
+TATTAGCATGTTAACCACATTCTTGGCAGCCAGATCAAAATCACTTTTCATCTGGTTGTC
+TTAACAATCCGATAGAATCTAATGTAGCGATGCGTACTAGAAATAGTTACAATCTACAGT
+CTTGCTGCACTTGCTGCTAATAATGAGCGAGGACCTATCCCTCCTTAAGCAAGTTCCTTG
+TTCCGTGCGGGGAGCCCTGGCGCTAACTCTTTACATGATTAGTATCGCATGTTGTTACAT
+ATATAATAGATTTACATCATTTCAAATGCAATGATTCGTGCTCCTAAAATGAGTCGTATG
+AATAGCCACAGCGTACGGAAACCTGAATTGATTTGTAATTTAAAGATCAACTTAATCTGT
+GTTGATCAGAGCGAGCATTGCAGAATACCCCTGCATCTAGGAATCGGTGCCAGTGTAAAA
+GCCTGTTAGTAAAACCACGACTATGTAGTGTGTACCACACTCGGAGTGCGTCAAGCGAAG
+TCAAACATGGAAATGAAACCATGCGTACGGAAAAGACCAGTGATTTATAAGGACATTCAC
+ATAGACTCCAAAACTGACCCGATGGAGTCTACGCCGAACAGTTGGTATCAACATTTGTCT
+CGATTTTCTGTTGGGAACATCCATCCCTACCCACAACGTACTGGACCATAATCAAGGGTT
+TGGAACAGTACGCTCCTGTACTCAAGAAGTCCTTGCACGAAAGCAATAGGTTGAACTTCA
+TCATATAGGCGATGACAGTGCTATCAGCCGGACTGGCTGTTCTCGTAGAAGTCACTCGAA
+TCAATAAGATACGAATACTCCATCCTGTACGGGGACACTATATTATGCTAGCCGATTCTG
+TAAATGTAGTCTTTACCGAGAATTGCTGACACTGATTTGAGTGTAGGAGGTCCGGTATAC
+ACTTATCATCAACTTATTCCTACACTCGGTTTTCAATAGTTCGTAGCCCCAGGTTGCATG
+AATATTATACCTCGGATAACACCTACTAATCCGTCCACAGCCTAGCACTTACTGGCGATC
+AATGGAGCATGATGTACTTAGGGGACGGTATGAACATTCTTAACAGTTCCAAATGACCTG
+TAGCAAATACAATAGCATCTTTGTTTAAGCATGGTCCTCTGCGGTTTGAAATGTCGCTAA
+TCTAGTGATATTCCTTGTAAGCCACTGTTACTCTAATTTAGCCCACTCCAGAACGAGTTT
+GTGTCCATGAAAATGTAACTCCCCAGACATGCAAATACGCCTTATTGCTGAATATCGGAA
+CAAACAAAGTCGTTATCATCCTGAAATCGACGACAAGTACATATTAAAGGTTTGTTTGGC
+AAAATAGGTAGCAAGTAGGATGTTCATAACAATTAAAGCGCGTAACTCCTAAATGTGCAT
+TATGCGCCGAGGACCGATAGCTGACGCCGCTCTAGCTTCTATTGTTCCACTGTACGGTAC
+AAAGATTGAATACGGAAACAGAATTCGTCAATTTGTTGAATTATGTTCTATTCGTTTTAT
+CTGGTATATTTGTTACCTAACGTATTTAGGGAAAGTAGCTTCATGAAGAAATCTAATCCC
+TCGCGTGACGAGTTTGCTGTGATTATTATGCGACCTGACTCTTGTAGTGTGGAGTTCGTT
+GTCGTATCTGTACAAACTGCCGACACGTAGACAGGCCTGTCTAATAAACCAGGGACCTTT
+AAGCGTCTTTGTAATTAAGTAAGTACCAGACCATCCTTAGATCAATATGATGCGCAACCG
+GACCGGATCAAATGTTCCAAGCTCGGTAGGTTATCCTATAAGAGCCTCAGCAAAATGATG
+TAAATTGTCAGCGTGTAGTACGGAAACAGATCACGGTATAATCAAGTCTAAATATTTAGC
+CCCGGTCTTGGAATGGCCTTTTATGCAACCAATTTGTGGCGATTAATTTCTCAACAGTAA
+GACAGAGAAAGCTAGAGAAGCTGGTATTATTCTGCATGTTGTCGAACCAGCTGTGTACAG
+TCAACATTTTGCTATTTACTAAGTTGAAGCTTTCGGTTTCATGTGAAATATCTGGCCAAA
+TCGAATGCACCCTTTGACCGGCAGTTTTCATAAGCCACGTGTTTGCATTTCTCTTTAACG
+CATTGAAAATCACCGCGAACGACCTCACAACTGTCTAGCTTACCGATACGTTAGTGGTCT
+CCTCGCAGAATCGAACGAACCCGAATAATATGGTGATATTCTTTAACGACTGATTAGGGT
+CTTATTCGAGATTTTCAGTCTTTAAGCGTGAGCAGCGTGTTAATCACCTAGCAACATTAT
+AGAAAGGAGAAAGGTACGAGCAGTTTAAAAGTTACTTCTAATTTTAACTATTGTCCAACT
+AAGTGTAGATTATTTAGGCTTGTGTCCAAGTGAGATCATACTGTTTTCGTGTGATAGGTA
+TCCGCATCATAACTAGTTATATTAGCACCGTGTATGAAGAAACGGTGGACCGTAGCACAA
+CTCATTGTTATTTTGTCCCCTCTTGGTTTATTGGATCCTAGATTATATACGAATAGAGCC
+CCTTTCGCAACAGCATCAGAATCAGACCTGCGCTCTCGACTGATAATAGCAATTTGTTAA
+GAGCGGATAGACGCAGAAGAATAACATGATTTGTGCACTTAGTCCAGTCCAGATAAGAAG
+TTGAGGCATTGACTTAACTTTTCATTGTCCGCTTGCTATCCCCACGATCCTGCTAAACTA
+AAAGCTTTTGGCGCGGAAGAGCCGTTATGGAGGTTCGGCGAAATTGTATCACTAGCTAGA
+CCATTTTCTGTAGGCTTTTAGCTTGATCGACGTAAATTCGATTCTATATGGTAGAAAGGT
+ACGACCGTTATACGCTCACGTACAGCCTAAATTCACTTGTGGAGGCGATATAAGCTAATA
+AGCGGTTCATTTTGAGGAACCGTTACTTTGAGATTCACTTACAGCAACTAAGGTTGTGTT
+ACCGTTTCTTCTCAATTTACTGCTGGAGCGGCTATTATGCGTCCATCACCTTCATAGCCC
+TAGTCATCAAGCCCATAGAGGTATGTTCGTGTGTAAACGAATTCCAAGACTAATTGGTGG
+AAATTTCAGTTTGGATTGAATGAGGCTGATACTTCTATACACTTAAGGGTTCCCCGTAAG
+TATATTGCCATAAGGGAGTAGTAACACTAAGGTTGTGAAAATATTGCACGACGTAGGTAT
+TCTCAATTTCCTTCTAATTCTGTAGGATTTATGTAAGGCGACCGGGACTCTATTGTTTTG
+TCTCCGAGAGTTTCTTAATCAATTGTCAGGCTAGTAGATCAAGTGTAATAAATGATTAGA
+GGTCCTCATTTGGAGAATTTATCTATATCCTTGGTCGTCCACGCGGTATCGGAGTTGCTA
+TACAATAAGTTGGTTCCAGAAAGCGTCTTAATTACATACTCTTGGTTTATCAACGAGATG
+GTACCTAATACTCTCCTCTCAGTTCAGTAATAAGGACCGTTAACCGCACAATTGCATGTC
+ACCATGTAACACATCCTAGGTTCAGTGGTGCAAACAAATCAAAGTCGTTCGATGTCACTA
+AAACATTTTGCTTAGTAAGCTCACTTGGTTATGCAATATTCTTCACTTCCACAAGTGACT
+CTACTTAAGGCGACGCACCTCCCTACAATTCGCATACGCCAGGTACACACAGCATGGAAT
+AGTGTAGTACCTACTCATGCGCGAACGGTCGCCTGCAGAATTCCAACATGGAGGTCTTCT
+GGCCTAGTGCTTGTGCTTCCGGGATACACCGCACTCATATCACAGTTTTCCCTGGCACAG
+GTTATAGTCCGCTAGCGTGTTGAAGCTAGTTCACCCTTACTATGATCCAAGAAAAGCTTT
+TCGGCCGGCCATCCTTCACCATACGTTTCGGGGTCTTAGTTCATTATCAGAGTCGGTGCC
+ATTGTTCCATGTAGGTACGTGGAGGAAGTAACTCTTGATATGCTATACGTGTAGCATACT
+ATACTCCAGAATCCGTCGCAACAATCCCTTTATCTGCCCCTTTATTTACATTCCCCGCAT
+GTTTTGATTACTTAAATGTCGGGTACTGCTGGTATACACCGTATGCACCGAAAGACAGCA
+ACCCCTCAAAGCTTCGACGAGTTACCTGGTGTGAGACTATCAGCTTATAACCCTTACTAA
+CAGCAGTAGACGAATTCTCCTAGTATAAAGTCAATTACAGTTGACTAAATTCGAAGTAGC
+CGAGTGGGTCTCATTAGACCCTACATGTATCTCTTGTTTTCAAAACGGCTGTGAAAGTCG
+GAATATTATGTGAGTATGATTCACTCGGCGGAACACTCAAACTCGCTGAATCATTGATTC
+GCCGATGATTAAGCCGACCCTCCCAATTACCGCTGCAGCACTACAATCTCAATTTAGGTA
+TACGGATCTAGGTCCGTTCGTTACCAGTTACCAATACGCAACCGAGCTCGAAGAGAACAC
+AAATTTACGAAGCAAAATTCGGAATCAGGGTATCGTGCAGAATGGCAGGAGAGCTGGAAC
+TGTTGTCAGATTTCCCTCTAGTAATCGTACGAGAATATATTCTATGTCACACATTAACCT
+ATAGGTAAAGCCTCATTATACTCCGTTTAATGCAGACTTATAGGATGCCATGCAACAAGT
+CTAATCGTCGCGAGGACACTCAAAAGGATCAGTGGAAAGTAACACTTTGTGGTTCAATTC
+AGAAAATCAGCTTGTTTGTACCTACAAGTACAAAACTTGGAGTGGTAGAGAGGTCAATCG
+ATTAAGTTAAAAGGTTAACGCATGCGCCTAGTCATTAATTGGTTGCTGCGCAAAATAATG
+CATGCGTAGTAAATCCCAGCCCCAAGTCGAATAGATTATTAACGCCGGAAGCAGCCATCT
+GCGGAATCTTCGTTGTGTCGAGCGTCAAACGTTGCTCCATGGCTCCCTCCCTTTATCGGG
+TTCTCTCATTGAGTCCAACTAAACATCTACAAAAGAACTTTGTTATGTGATATAGCTTAG
+GTCTAATCTTAGGCTGACATGCATAACGCTTTGTCGAGGTCTATTAACATAGCCGAATGC
+ATGCAAGCTTTGATGGATATTAACTTCCCAATGTCTAAGATTAAAGAAGAGGACACCCAT
+TATGTCAATCATCTAGCTAAATCGAGCTGCGAGCCGGAGAGTAAACAGTTTCCTTTTCTT
+CGGCGGTTATTTGAAAATTCCTTTCTTATGGCAGTGTTTCGAGCGAGCAGTATATTAGAC
+CCAACCTCGATAATCGTTAATCACATAGCGACTATGATAGTATCATTACCAGCAGCATAC
+ATAAAATTGTAAAGTGTGTTACTGTTTGCGTGGGTGATTATAGTACAGTCTTTTGCAAAT
+CTACGGCCCTGACAGAACTTCACATTAAAGGCCATCCACAGAACAATGGACAACGTATAA
+AACCTAAAAGGATATCGTTTTCCTGGGGTTTTCAGTTGTTTTAATGACCGGTAAATTTTC
+TTACCCTATTGTGTTTCCTTACACAGAAATATCTGAATATTGAGGTACCTGTGAACATTA
+TCATTCATACAACATATCCTATCGCCCATCCTGTGCGGCGACTACTCCAGCACTCACTAA
+TTGTTAATCATCTCATACAACTCGTCAGAATTAACATTACCGCAAACTGCTTACTAGCGC
+AATCAGGTCAAGAGGAGGACGGCTTTGTCACTTAAAAGAATAAGGTGTAGCTGCATAAAA
+CAATGTGTATCTTCTGAGCTTCACAGCCGTGGGCTATCTATGGTTCCGGTCCTGTTGATT
+GCTCCCGATGTTGAACAATACTTTCCACTTTCCGTGACAGAAACTTTAGAGCAAGAGGTC
+AAACTTTACCCAAGCCCATAGGTAGAAGTTACGCGCGCATTGACGTTTGATCAAGGGACA
+GCTGTGAATATCCGTCCCACGTAATCGTGACTTCTCATCAATATTATATTACTGCCGCTA
+ATCAACAACTTCCTTGTTTCGACTGAAACGATTTTAGTCAAGTCGAAGACCTCATACGAT
+AAGATTTGCAACATGTCTAAAAGAGAACGGGAACTGGCAAAAGGCTTGGTAGATCCGTCT
+ATAGCGTAAAACTGATTAACCCATTAGGTCTGAATAACTTTACACAACCCTCCGCACTGT
+TAAATGACGGGCTTTGCTCTGTTTTGACACATCAGCTAGAAACTCGCCACGAAGGCATAA
+GGCTCCCATATAGCGTAGCTGACAAACATATGAGGTGGCTGCATAAACTAAATTGAGGCT
+CGCGTTCGGATACTTGCCCATGTAGCAAGTCTTGGCAACCAACTATATAATCATCACGAA
+TTGAGTGCTAAAGACATGCGAACAGTTGGGGCTGCTATATAGTATGACAGATATAGAAAT
+TTTATAAAATGTCGTAGGAATCTGGAGGCCAAAATCATTAGACACTCTTGTAAAAGGTAT
+GGTAATGTGTATGACCTCTTGGCATAGTGTCCAATTATTCTCGGTTTACTCTCAGAGACA
+CAGTCATGTAAAAGTGGTGAGGAATTACCGCCGTGTTTTGCCAACCAAGAAGCATTGAAC
+AGTAGATCAATAATGATATTCGGTAGCGTATTTACGCTTTGCGGTTTTCAGAAGAAACTA
+TCACAATTGAAACTCTATTCTTCGCCTCATTCCGTACCGTTAGGAATGACTCGAATCGTA
+CTGTCTGCCGCGGGGCATAGTGTATTGCTCCCCACCAGGTTCAGATAGTTCGAATCAGTG
+CGCTGTACAATTGCCTTACGTGTAGATTTGCATCACCGCTTCACGTAGGCACCCAGAGTG
+CTCACTAAAGCCACTAGAGAGATAGAGTTAGAAATTAAGTATCGGTTACGCCCCTCAGAC
+GACATAACTCACTTCTACCGAATATCCTTTCTATCTTGGATACTACTAATGCTTCCGTTC
+ACGCCGCAATCATGTGGATCCTCCAGTAAGCAGGGTGCTGTCATGACTATACAGTACGGA
+TCCGTAAGCATTTTGAGGATGATAACATAGGGTCGGTTACTGTGGATTTCCGTTACTTAG
+GAGAGCAGCTTTAGCTGACTTTGCTGAGGCTGCGCGTGTTAGACAGCAATTTACGAACGG
+CGCACTCTATAGCAGGCACTCACAGTGGACCAGTAGTCCTATTGCAAGAGTTCATTATGG
+AACATTTTAGTCCTCTATCACACGGACCATTGCAGTAGATAACTCTAATCCTATGTCTTT
+ATTTGGTTGCCTGGAACCCCTTACCACTAGACACCCCAATAAGTAATCTTGCTTCCATGT
+CGAATTGATACTCATCGAAAACATATAAAACTAATTATGCTTGTGTTCCTGTGGTCTGTT
+ATATAGAGGCGCCCTATTGGCCGCGGGATAAGGATCATTTTGGCACACTAACGGGATCCT
+AAAACTTTATCTTTCAACGACTCCTACATGCCTTTTAGGTTAGTACGCGAATCGCCTAAC
+AAGCCAATGGGTATTGGAGAATTAGACAAAATGGTTGAGGAATAAAGTGGCGCAGGATTT
+TGTCCGAGAAAGGGATAGCAAACGGTCGCAGGCAGGAGTAACAATTTTCAACCGACCTTA
+ATAGAGCTCAAAAGCTACCGGAGAAAGCTTCGTCTATGCTTAATACATATGCTAACCTAT
+GAATTTCGTAAGCGTAATATAAACTTATCAGATATTTTAAAAGCATCCTATTCAGTCGTA
+CTTTTGGCAGGAAAGGTCAGGCGAAACAGAGTCTCCCTGCGGAGGCTTTTAAAATAAATA
+GCGGGCCTAGCATCGATTCTAAAAGACGACCCCAGGTGCGTAACCGTGCCTCCCCAAGTC
+TTCTTTTAACAATTACCTAGAGAACGGCGTCAGTCGCGAATGACCTTACGAACGTTTACG
+CGGAGCCGAGTAAGATTAATAACTGCTTATTGATTTGCAATCGTTTGATACGGGTGGCCC
+GAAGCTCAATATCAACATAAATAAAATTAGTCGGAATGGTCGCTTAAATCGCGCGCTGTC
+ACTGTCTTCATATGAGGGAGTTGTGTAAGACTGCATTGATATATAGGTATGATTTCGGTT
+TAGAACTTTGTCTGTTAGCAACTCCGCATGATTGAAGGAAATCCTCGTTGGTAAGATCTC
+TTTAGCATTTGCACAGCTGACTCTAACAGCATAGTATGTGATCGTATTATGTCTGCAGTT
+TGTAACACAGTGGGCGGCATGGATGGTACTTAATGGACGTAATGAGCAGTAGACCACCGG
+TGTTACCTAACCATCATTAGAGTAGGCGAGATTGCGCTTGTACGACTTATATATAAGGGT
+AACCGGAATACCGTTCCTCTTATCAACAACAGTTACTGGTCTTAATTCACATCGGATATT
+GCGATCGCCAAGACTATCCCGTAAGTCGTAAGCTAACCAACTAGCGGTTAGGTTTATTGA
+GGTTTTGATGGGAACTTCTCAGACACGTCGTCAACTACCTAATTTCTTGGATGGAGCTAG
+GCTAACTGTCCCAGAACTTTCTGACACTCGAGATCCTCTAACTAATTGGAATCCAGGAAT
+TCCCTTATTGCATCGCCACAAACGACCATAAATTACAGCATGTTTCATTGTCTAACGTGC
+CTATCCACGAAATTGAATTCGGTTCACATTATATATCCCCTTCTACCGCTAATTTAATGT
+TTAACGTTGATGGGGCAAAGCACATTCGAGAAGTACCGAAAAGTCTCAATCCAAAGACCG
+GAGGAACTGGCTTCGGTAAGAATCGCGAGTATCCTTGGATGCCCTGCCTGATTATAACTT
+GTTCCATGTAGATAGGCGTAGCTAATTCATAGCAATACAATAAACGAGTCAGAACTGTAG
+TCTAACATAACAGCCTGCTCTCCAGGTAACAGCCCATTATTAGATATAGTATCACGATCG
+TCGGTTGTATTAGTGGTGATAACTATCGATTCTGCCACTAATAGAATGTGCAGAAATAAA
+GTATCTGAAAGAAAACGAAGTCACAGAGAATAAAGCTCACTTCATAAAAGTCGGTTGCAG
+TAGACGCATATCAATTTTCCCTGCTGCATTTTAGAGTTCGGAATAGTTAAACATAATACT
+GGAAGCGCTTCCGGCAATCAGGAATAACCCCATATAAACCAACCTTTGTTGCTATTGCCA
+GCGCTATTCTCGTCAAAATTTCTCCCTATGGTCTTCACATCATGCATCACCGGACCCTTT
+GATAGACGATGACCCAATTACAATCACTCCACGGATGAGCATCCCATTTTATACGAGGCC
+CACTGGAAACAATTGCAATCGACGTGACCAAGTAGAGGAGCGTGCTCGAAAGGTGATGAT
+TGCCGAATTCTAACAAGGATACTATAAGCCACGGAACGCTGACGTTGAACAGACCTGGTC
+TCCTGGGCACTTCGCAGCACCTCAGTAGTAATTCCGGTAGATTAGGACTTAGCATTCCGT
+TGATCTTACAGGATTTATAAATAAGGAGATCTGTCTTGTTTAATTAGGAGGACGCTTTTC
+CCGCGTAAGTACGGGAAAACGTTCTTCTGATTTTGTTTGCCACTTGACATTGTAGCTGCT
+AGGAGAAGGGATAATATCCGCGTTTTCTTTTACCGTAACGTCGGAGCATACCATGGTAAT
+TGTCCGTGTCAAAACTAGATATCTAGGTTGCAAAATTCAGTCAGTAAGTCCTGAGGCCTT
+CCGCATTATTAATTCTACAGACATATGAATTTGCTCCACCGGCTAGCACAGTCAACTCAA
+CCCACGATAGGGGAACGAAATCACAAATAGGTTCACATGGTCAATACAAGGCAAACCATT
+CCCCATAACTCACGCACTGACGGTAAGGCCATTTCAGGTCAAGCGGTGAATGCTGTGAAA
+AGCAGCTCGACCACCTGCCGTGGATGGCAAACCGATAACAAAGGACTCCGATACTTCATT
+TGTAAACGTTTGCAGTGCTGACGTAACTCATATCTACAGTCAAACCGAATGGTTTGATCG
+GCATTATGTAAAGGAATCGACACACGTTGCGTCTTCTAGATTATTACACACCTGTCTGCG
+ACGGATATAGGTAAATAAGTCAGCCTCCACTCTGCAGAAGATACTAGAAACGTATCAGTA
+ATAGCTATCAGGATTTCGCCATCCTCGCACTGTGCCCGGATATCACAGCAAGATTCTAGG
+ATGGCACTTGTGTGACTAGAGGTTTTACTCGTTGAGCCATTCTTACTATAGGCATGGGAT
+TACAATGTGCATGTTTGTGATGTTATCCCATATCTTGCATGTATCAGCCTACCAATTAGA
+CATATGACTAGATGTAGTCGATCAACGCAAGGGTGCGGACTTTGATTCCTTTTGAATTGA
+AGTCAACTCAGATGCTCCTTAAGACGTTTTACAGTAGGTATTTTGTGGTACAAACCAGAA
+CCAGTGCCAGTCGGTAGTTATTGTAGTGTGTTCTTAATACATATTTGGTATTGGAGTTTC
+TAACATTTAAAAGGAGCCTATTACACTTACTTAATTTGCGTCTATATTTCTGTTACGATA
+TGTCGTCTGTCGATTTTACGAGTTTCATACGTGCGGGTTCCCTGTTCGCAATGGGCCCCT
+TGCTAATGTCCCGCATCTTTAGGATGCAAACTTACTCACGCCTCCTTTACCGAGACTTGG
+TGGGAGAGAAGACTCCTGTAGAATCCCGATCTGAATGGTTTCAGTGTAAGGGTCCCTTCT
+AGCCATATCATTGAATATTCTTGTACTTTAAGTAACTCGATCCTACCAGTACAATTCTAG
+GTTTGCCTTATAGCCGGAATGAGTATCAGCGTCATTCACCCCGGCCGGATATTATTTGCA
+ATGTCAGGGACACCCAAAATAGACCGGTTAGAAGGCATATGCGATGAGAGTTGGTGCCTA
+AATTAAACGATACAATTGATATGACAAGGACTATACGATGAAATCCATGAGATAATTATC
+GTAACTCGGCCAACCTAAAACCGTGCAAGATAGGAGCGGTCCTAGAAGTACTATCGACAC
+CTTAAATACTCACTTGAGTTTTCCGATCCTATAGTGCCAATCATATGGCGCAGGAATATT
+ACAAACTAAGAAAGTCAACAAAAGATGTAAATTGCAACACCTGGCATCGGTGGGGTTGTC
+CCCTTAAACCCTGAAACCAACTGTTATGCTCAACATTATATCGAGGCTAAAACGCGTATC
+GTGGCACATTAATAACGATCACATAAGCTTTGCGGCTAGCAATAATAATTTAGGACAGCT
+TAGATTTTGACCCGTGCTAATCCTCAGTATGGAGTAATTTTACGGATCTCTCGTTGTAAC
+CGTCCTCAGTCGTGTACATTTTAACCTTTGTAAACTAGTTTACGAACGAGTATTTAGAAG
+GTCCGTACTCTCACCCAACTGACACATTGTACTAGCTCAAGATCGCAAACACTAAGGGTG
+TGAGTCGCGGGATAGCGCTTAAATATGACTGCTAATGGTCAAGAGCACGCGCATAATATT
+CCACTGGTTCTAGGTCACCACTACGGTCAGACGTTGACCTGCATGCCCTACATCCGGCAC
+GGGCTACTAACGGCCTAATATTCTTTGAGCCATATCCATACTCGTCTATGCATATTCAGG
+TATACGGCTATAGTGCGTTATTAACTTCGTCGTGATTAAATCCTTTAATTGTTCCATTAT
+AAGTATACATGCTTAGATGCGTGAACTTGAGGGATATCGTTGCTCTAAAGTTGTCTTATA
+GACTAAATCTAAACAAGCCGTGCAAGACTACTTAAATTACAAATCTTACAGACATCTCGC
+CACTGCGCTAACACTAACAA
diff --git a/pipelines/nf-atacseq/tests/data/bwa_index/chr_test.fa.amb b/pipelines/nf-atacseq/tests/data/bwa_index/chr_test.fa.amb
index 0719bfe..5d6da8b 100644
--- a/pipelines/nf-atacseq/tests/data/bwa_index/chr_test.fa.amb
+++ b/pipelines/nf-atacseq/tests/data/bwa_index/chr_test.fa.amb
@@ -1 +1 @@
-19800 1 0
+20000 1 0
diff --git a/pipelines/nf-atacseq/tests/data/bwa_index/chr_test.fa.ann b/pipelines/nf-atacseq/tests/data/bwa_index/chr_test.fa.ann
index 01f4a1e..a633aab 100644
--- a/pipelines/nf-atacseq/tests/data/bwa_index/chr_test.fa.ann
+++ b/pipelines/nf-atacseq/tests/data/bwa_index/chr_test.fa.ann
@@ -1,3 +1,3 @@
-19800 1 11
+20000 1 11
0 chr_test (null)
-0 19800 0
+0 20000 0
diff --git a/pipelines/nf-atacseq/tests/data/bwa_index/chr_test.fa.bwt b/pipelines/nf-atacseq/tests/data/bwa_index/chr_test.fa.bwt
index 7b2e7ab..9ed4852 100644
Binary files a/pipelines/nf-atacseq/tests/data/bwa_index/chr_test.fa.bwt and b/pipelines/nf-atacseq/tests/data/bwa_index/chr_test.fa.bwt differ
diff --git a/pipelines/nf-atacseq/tests/data/bwa_index/chr_test.fa.pac b/pipelines/nf-atacseq/tests/data/bwa_index/chr_test.fa.pac
index dd39245..d99d805 100644
Binary files a/pipelines/nf-atacseq/tests/data/bwa_index/chr_test.fa.pac and b/pipelines/nf-atacseq/tests/data/bwa_index/chr_test.fa.pac differ
diff --git a/pipelines/nf-atacseq/tests/data/bwa_index/chr_test.fa.sa b/pipelines/nf-atacseq/tests/data/bwa_index/chr_test.fa.sa
index 76e12a6..b19e11c 100644
Binary files a/pipelines/nf-atacseq/tests/data/bwa_index/chr_test.fa.sa and b/pipelines/nf-atacseq/tests/data/bwa_index/chr_test.fa.sa differ
diff --git a/pipelines/nf-atacseq/tests/data/chr_test.fa b/pipelines/nf-atacseq/tests/data/chr_test.fa
deleted file mode 120000
index 60a78a3..0000000
--- a/pipelines/nf-atacseq/tests/data/chr_test.fa
+++ /dev/null
@@ -1 +0,0 @@
-../../../../tests/shared_data/chr_test.fa
\ No newline at end of file
diff --git a/pipelines/nf-atacseq/tests/data/chr_test.fa b/pipelines/nf-atacseq/tests/data/chr_test.fa
new file mode 100644
index 0000000..182b3f7
--- /dev/null
+++ b/pipelines/nf-atacseq/tests/data/chr_test.fa
@@ -0,0 +1,335 @@
+>chr_test
+GAAAGGCATAATAAGTAGCACGTACTAACGCGTCTTCGCTGAAAATAGTTAACGGAGATC
+GTGCGAATAACCTGTCTAATAGCTACTAAAGCTATCTCCAGGTAGATTCCATACCTGGAG
+TGTATACCCTACCATAGGATTACTATGATCGTTAATGAAAGACCAAGAACTTGCAATTTG
+GCATTCAATTAACTCTACCCCATATATCAGTTCCTGATCTTGAGTCACAAGGAACAGGTG
+TCAGATGTTGATCCAAACCCTACGGCGACTGCAAATAGGAGATCCATAAGGAGTTAACCT
+CGAATCCCCAAAGCTGACCCCAGTCCCCAGACCACTTCAAATCCAGTCTCACACAATGTG
+TTTAGACTGGGTAGTTCGTTTTATCGCGTTAATTGTTATCCAATGTCGGAAAATCATGAG
+TAGAGGATACTAACTCGCGCCGGTCTCGTAAGGTGAAAATTAAGGATTTATCGGCGTATG
+CCTGTGAATATGTATAGATTAGATATATGTGCAAATCTGGGGCAAAAGTAGGAGGACCAA
+TGCTGAGGAGCGACGTTTTCCACGCGTGCACTTTGACCACATGTACAACTCGAACAGTGG
+GTCAAGTGTTTGTGAAAAGGAATGCTAAAATTACTGACTCTTTAACTCTAGAATTCAGGC
+ATTTCCTGGGCAAGAAAATGTAGGTGCGGGCTTGCCAATGTAAGGCTTAATTAACCTCCG
+AAGTGCAGGTATTGCTGACCTTTTCTTCGTTATGGGATCTGACGAATTACCTACTGTACC
+ATTCTCCACTCTCATGCTATTTTAAGTAGAGGCTGCCTATGCCTTTGTGATCTGGCCCTT
+GGCAAGCCGTAGCTGCACTTATTCAACGACATAAACCGATTGGTACATTATTCTCGATGG
+AGTCACGTGGGGCGCGTTTGATGAATCTCCACTCGTACACCGCCCTCATTGGGCCAAACT
+CAACCTTACTTACATGGCTGATATTCATTCCAGTCTTAACTGGGAGAATAGAACTACACA
+AAAGAAGATAAGTGTGTATCAGCTTCATTGTCAAGAAGTTCTTGAGCGGGATATTTATGT
+ACACAAGCTGTTATGGCGCGTTAGAACTGTCCCCGGACCAAGTTACTTAGAGATTTGGTA
+AAGGAGTTAGATAGTGATGATAAATAGATGTCCACAACCTTGTAATCGCCACAGTTTTAT
+ATCTGCCAAAGGGAGTGGTCTGGCGAATTAATTTACACCGTTTCCTCGTTAAACTGTAAT
+TTATATTGGGAAGAGGCCTGATCGTGCTTCCGCGGTGTTTAACTAAACAGCCATGATACG
+CATTGATAGTTTCTCTCCTATTCCCAAGCTACCAGACATCATTAATACTACCGCAACGAG
+TAAACTGTAATATCTACGATAATGATGACATTCTTTGCAAGTGGGGTATCAGTGGCAGTT
+AAACTCTAGATGCTATCGCTCTTCTCGAGCTTAGTGTGTACTCACCAGTCGCAGGAAGTT
+TGGCTGTTTGAAGTTTAATCACTACTCTAGCTTATCCGCGCTAAACATTCTGATCGTGCA
+CGTGTCGGACTCAAAATGTCCCAGTATTTACAGGGCTCAAGTGGTGTGACTCGTAATTAG
+TGGCCATTTTAAATTGACATTTGTTTTACTCATATCGTTCTCGGTTTATATGACGACTCT
+CGATTAATTTGTTGACGTTCTGTCTGCGCGGATCGGTGGAGGCAGACAATAGTGCCGAAA
+TGTTACTTGGGGAATACTAAGTTCCAAGTCCCCTAGTTATATCGAGGAGTGATGAGATCT
+CCTACTGCATTGCCACACCTTCCCCATACACTTCCTAAATAAGCTGACCCTAGAATAAAG
+CTGAGGAATTTCGTACTGAAAGGTTTTGAAGCATGATATTTATTAAGATCTTTATCGTCG
+TATACCACATGGCGTCTCCTGGTGTATTGAAATGTTCATACGACTGCAAAAGGAGTAACA
+TACGTGGTTAGATACCCGTTCCGGTTATGTCTGCCTCTAAAGCCAGAAGGCAGGTTCTCA
+CCACTAGACTGTTTATTACTCCTTTAAACTTATTCTGGACCGTACAGTCTGAACCGGTCA
+GATTGGGTTATATACACGCCAAAATCATTTTCAGCGCGATTAAATTGTCATAACCTAACC
+TACTCGGGTAAACTCTGACGTCATCTGCTGAACTTCTGGAGCGAAGGGTAATTAAATTTA
+TAGTTTTACCCTATATTATTTAAAGGAATCTGCTTCCCATCATCCTGTTATCTATGTGTC
+TGTTGCCTTGAGGGACTTTCGTCTCTGAGGTGACGTGCTAATTGTTTGGTTAATCACATT
+ATTTGTTCACGGACAAATCATAGTAGAGTGAGCAACATTACTGGGGTCGCGTGAAATAGT
+TATAGGGCTTATTATAACCTTGTCTAAGTATATGGTAAGCTCAGTCACGTCTTCTCGACG
+TGGAAAATATTGAACCGACGCCCACAGCGGTTATTGCATACTCTAGGGTGTATATAACTT
+TTGAAGTACTACAGAGACAGATCATTGAGGATAAGAGCCTAATGATCAGGACATAGTGGA
+TGCAAGGTCTAAATGGGGCGTTTGTACCTATGTCCCACTTGGCGAAAACTGTTGATGATT
+ACTTGCGAGGCAATTGTGGAGGACTGGAAGACGACAAGTATTTTAATGATACATTACCTC
+GTTTGAATTCACCCATACTTAATTGTGTGACGAATATCCCAGCGATATACGACCTGTCAA
+ACATTCAATCGGTAAAGGAATTTCATAAAGCGACTAATTGACATTGATCAACCACTGGGA
+CAACTACCTATATCTAGAAAACAGATTTAAAACTGCCCGTTTCTTATACGACTGCCAGAC
+CACACCTCCAGCGCAGCTTACCTTTAAATACAAGCCTAGCGCCCTCTATAACCCGACGCG
+AGATGAGCCTCCAGCCATCAGACACAGGCTAAAATTGCCTTTATCGGAACTTCAATGTCA
+GGTACACAAAAGGGAAAATCATTTGGAAATACTTTGATACTTATAAAGGATTCGTCCTTC
+TCTACGTCCGGAGACCCATCTCGCACCATTTATCGGTTTAGGCCTAATTTTGAAAGGACT
+AGCCACTATGACACTCATGAACGGCCTATTACCAACCATCGACTGAATGACGTACGGATA
+TCCGGATAGGACGGAACTCGTTTATGCTATGCTGGTAACGCAGCTAGCCCGGGGCATTAG
+TAGATGCGTCCCAAAACGAGTATGTGTATCTCGCACTCTTACAATTCTTGGTGAGAAGAG
+TGAGGTCTAATATCAGGAGTATGACTTGGTCCTCTACCTAGAGGATGACATACGGAGTTT
+TAGGTGGAGACAGAAAATTAGTATACTAGCCGAATGAAACTTAAATCTGAGACGATTGCA
+CATCATCCGCAGACATGCGATTAGCCACATAATGGGTTCGTTGAGATGTCTCAGACCCAT
+ACAAGTATCTCTATGATTAAGGTTAGCTAATTGTGGAGATCCTTGAAAGGAGACTTGGAT
+CCGGTGCATTACCTTCATGATGCTTCCGACCTATGGTGCGCGAGTTGCGCTGTATTTGTG
+CACCTAAGAGAAACGTGACACGCGTAGCAGCTCCTTAAGGCCCGGGTGGCTAGAATTTTA
+GATGAATACGGTTTGTAAATTTAAATTAGTCCCAGTCGGCGTCCTTACCTCTACATCACT
+AAGGCTATGCGGCGATTAACTTAATGTAGTGGGGACAGTAGTTGTTATCTCAGCCGTCTT
+AAGTCTGCTTGTAACAACCCCTTTAAGTTAGAGCTTGTGTTTTAAAGTCAGCTTTTAGCC
+ATACAAATAGTGCTTCTGTAGGTTTTGCCGATTACGCGTTATATAACTTTACTGTCCATA
+GTGCTTCTTCTTGTAAAGAATGAACGTTAACAATAGATAAACGTAGGAATCCACGCCAGA
+GTTGATAACTTAATGAGTATAGCCGGTTATACGTGGGGAATACACTAGGTAAGGTTAGAC
+TTAGGTGTTTATTGGCGGTGAATTTGGACAAACTAAAATCGTGGCCGTAGCAAGTAAAAT
+CGTTGTGAAACCTCAGACTATAATCCCCTGCTGGCTTGAAAGCGATCTACAAGCACTTCA
+CGCTAGCAAAGAACGGGGTATGTCCCTCCAATACTTTTGACGTGAAGTGATATGTTAGTC
+AAATAAAATTACACATCCTGGTTTTGACTGTTTTCAAACCATGAGTGTGCTAGAACTGTC
+AAATTAGATCTGCTAAGGCGAAAACTATGAAAGCTAAGACAGCTTCTATCGAGGGTTGTT
+TCTTATACCTTACCTATTAATTTTAGTTATAGCCGAGCTCAAGGAGAAATAAAGGAATTT
+CCTCTCCAGATACCCAGAGTGATGTCTGTTGACTAGACCAAGTAAAGAAGTGTAAAGCCG
+AGGCAACGGCTAGTACTTTGAATGACCTAATATAGTAACGAGGTTTTGTGATACACATAT
+CGTGATGACATCACATCTTGCAAATCCAGTATAGAGTAGTTGCAATTACTTTCTTGTGGT
+AGCACTTGCGTCTTACACGATTCAATATGACATCGGCACGTCGTGTAAGTCTCCAGGAGT
+TATATAAGTTGTAATAATATATGAATTGAGGAAGTCAGTTTGATCGCTAACATGCAACCC
+CAGATAATATATGAGAGGAAAGGAGATACGCACGATCATCTATTCAATTTATTGACTCGC
+CCATAACGATCGGAAACCTTAATCCTGTACCACCTTCATCGGCTTTCCCAGAAGGATAAG
+TGTTGGTCTAAAGAATGCGACCCTTTATAGTTGGGTCGTTCACTTGTTGATTTCTTGATA
+CTGAGCGATTAGGATAGCCGAATTTTCTCTTGCTGACAGTTGTGAAAGATCTACAGTTAG
+ATGTCAAGACGCTCATAGGGGATTCATTTATTTAGATTGGAGGCTGCCAGTTCTATTGTA
+GGCAAGACCCTTTGAAACTTTAGTGGAATTGCCGTGCTTGTGCTGTTAGCCTCAACGCTT
+GCGGTATTATCATAGGCTATTACGTGACCCGAGTGTACGGATATGTTTCTAATTAAAAGT
+ATTAGAAAGTTATGAATAGGCGGTCGGTCGTACCTTGGTAACGCTGGGCTATTTAGGAAC
+CTGCTTTGTCTTCGGTGTAGACTTGTTCACAACGTTGACCCGAAATTTAGTTCTCTCTAA
+CTATTTAGCTCCAGTTTTGTATCCACGAAAGTTCAGTTGGTATTTTAGTCATTTTCTGAT
+GAGCCGTACATGCAGCTATGTTTGTCCAACGGTATAACCGAATCAAACAAAGATCAGTCC
+TAACATCGATGAGTGGAATTGGTTGTACACTGCGACGCTCCTAAGTGGGGATGATGCAAA
+TAAAACGCCGGACAGCTCCGATCGCATCGTAAGTTACATTCGATAGAGCGAATATCAGCG
+AGCTTCTTCGGTACCTTCTGTGCATCATGGAATAGCGTAGGAAGGTATTTCTCAAGAACG
+TGCATCAAGTCAGAAATCTAGCATCACTCCGTCTACCGGTAATGTTCAACGGATAAAGCT
+CGGAGTTCGAATCGGTAAATATGTAGGAACGCTAGAGATTCGAGCAGTACGGTAGTGTAG
+CTATTCACTTAGGCAAGAACTATCGGGGACCACTCGCAGGATTCGATACATGATTCCTAT
+AGCATGATTGCGATGCTGTTGCACTATACTCGACGACGCATGTATAGACAATCGCAGATA
+GAATTTAGGTTGCCCCACTACACAAGTCTGTCTATTGTACACGTTGTGGCTTAGAATCGA
+TTACGACCGGAAATAAATATTTTATCTTATTAGCTGTACCTATCTGGCATTTCTAAGGAC
+AATTGATATGCCTACTTATCCAGTCCACCTCAGAATCCACGATCTTGGAATTACCTTTAA
+ACCTGCTTGAAACAGGTCGTGATTCAATCAAATCTATCTGAAGTCCGTGGAGCATTTTCA
+AAACGCTTTGATACCTTTCCGGTGACACAAAAGGAGGAACTAAAAGGGCACATACCCTAT
+GATATAAAACTCAATGTGTCATTAAACAAAGGTATAAGTCTTTCAACTGACTATGAATGA
+CCACTGCACGAGGAGGTTGTTAGAATGAAAAGCTGAGAAGGCAGTATCTCATCTTTTATC
+TGTAGTAGGGTTCTTTCGTCTAACTGACTATTTGAGGCATTATTCTCAGGCTTTCAGTTG
+TGTTTCGCTAACTAGACATACTACGTCTTATGTGAAGCTACGTCTGGTTGTTAAGTTTCA
+ATCGAGTAAACTTTGAAAACGACCTACAGCCTTGACGAAGCTCCCACAACTGTGATAACT
+AGTTCTTGCCCTGCACGCGCGGATTCTCACCTCTCAACAACCGCGTACCCTTCGCCCGTT
+GCGTAAGGCATGTAATCCGCGCTTGAGCCATACCCACCGGCCAGATTAATCAGTCTGAGA
+CGATACGCAGTTATAGCTGTAATGGGGAAATACCCCGGAAGTTTCTGATCCATTAAAACC
+GCACGGATCTCGACGCAAAACTCCATGTTCCAACAATACGGCTTTAGGCAGGTGCCAACG
+TCGACGCTGGCTAAGTAACTTACCACAGAGGATTCTGAGCTTCTTTGCGTTATTAGATGT
+TTCTAACCTTAAAATAGTAAATAGAATACTGTGGACCAAGGCATAAATGCCGTGCTGGTT
+AAAACCAGGTGCATTTAAAGCTCGATCAAGGCCGGTTTTGGGCTGTTTACTTTCTGAAAT
+AACTGCGATGCCGGCCCGAGGAAGATCTAAACTACCAATGAAATTACAAGTGGCTTCAAG
+GCCAAGCCATTTGAGTACTTGACTTATGTGAGTACTTTCCTAAACCATCAAGGGCAGGGT
+TTGTTGCAATCGTATGGGCGTATATGGACAATTGAACGAGGCAATGTAGATGTCCCTCGT
+GTAGGGGTATGCTAGCAACTTTTGTTATTTCTCCAAGAGCAATGCTCGTATAATCTTCAG
+ACCACTATCTTTCGTGGGTTTTCTCGTATTCCGGCGTCGTATAGTATATCACAAGAGCTC
+GTACATTCTAAAATATTAGTAATTTTCAAGGTGTAATTTTACACGATGTTAGACTCGTTC
+TATCACACTGCTTGGTAGTTTAATATGCTGTAGTACTTGAGGATCGTCGGTGGAACGGTC
+CTAGGATCTAAACTAGTGATTACGAACTCTTTGTGTAAAATATGAGCGTATTCGCACTCA
+GTTGCAATTAAATAGCTAAATGATCGGTAAATATCCGGGGTAAATCAACTTGAGTTTAGA
+GGATCCGTCGTTAAGAGATGATGTACATTCGTCGATTTAGGATCCTAACGTGGCGTTCGT
+ATGAAAAGAGCTGAACTAAATAGGAAAACGTTAACCAGTGACTACGCCCCAACCATTGCA
+AGATGTACCCCAATGATGGTTTTGGTATCGAAACTTCTCTTAATTGTGTTTCTTAAGTAC
+TGGCAAAATTCGAGCCGGCATCGTTTGTTGATAGTTGGGTCTAGGATTTTACACCTTGTG
+TTAGCACTGGGCCATTAATTCAATAGTAACAAGAATACTAATTACCAATGTGCGTGAAAA
+TCTCCTTGACTGGTGCAACGTCATTCACAGTCGGATCTCAAGTTATTAGGTGCTAACTGT
+ATACACCAAATTTAGGATAAGAGCCGGCTTAAGGCTAATCTAGACCCAATATTAATCAAT
+ATTTTACGTAATGCATCCACGCGGCGTGCTCTTGGTGAGCAGCTGGGATTAAACGCGTAG
+GTCGAACTATCGAGGGTTTACAAGAAAGCCAAGTGAAAATGAGACTATTGGCCATCGCGA
+GATTTGAATAAATGTCCCTTGGTACTTATACGTTGGGCGAACGGGGATGAGCCAGGCTGC
+TATCATCGTTTCGAGGTAGCTTCCAAGTGGATGAACTCAAAGACTGGCATTATGTGAAGA
+GCATAGCGCTTTTCCCCGTATTATGGCAGCAGCTGGTTACCCATACTTGTGATCCCCGTA
+ATTCTACTGTCATAGAAGGATGACCGAATCAATGAGCCGGGTGGTGTCCAAAAGCGATCC
+TAATCCTTGCTGATTTACCTTGAGCGGTCACGTCTGTCTCAGCGACATTCGCCTTGCGTT
+AGACTAGGCCGTAAGTAAGGAGTGCACTCCACAACGGCGTAATGCGTGCGGCGAGTAATG
+TATTAGCATGTTAACCACATTCTTGGCAGCCAGATCAAAATCACTTTTCATCTGGTTGTC
+TTAACAATCCGATAGAATCTAATGTAGCGATGCGTACTAGAAATAGTTACAATCTACAGT
+CTTGCTGCACTTGCTGCTAATAATGAGCGAGGACCTATCCCTCCTTAAGCAAGTTCCTTG
+TTCCGTGCGGGGAGCCCTGGCGCTAACTCTTTACATGATTAGTATCGCATGTTGTTACAT
+ATATAATAGATTTACATCATTTCAAATGCAATGATTCGTGCTCCTAAAATGAGTCGTATG
+AATAGCCACAGCGTACGGAAACCTGAATTGATTTGTAATTTAAAGATCAACTTAATCTGT
+GTTGATCAGAGCGAGCATTGCAGAATACCCCTGCATCTAGGAATCGGTGCCAGTGTAAAA
+GCCTGTTAGTAAAACCACGACTATGTAGTGTGTACCACACTCGGAGTGCGTCAAGCGAAG
+TCAAACATGGAAATGAAACCATGCGTACGGAAAAGACCAGTGATTTATAAGGACATTCAC
+ATAGACTCCAAAACTGACCCGATGGAGTCTACGCCGAACAGTTGGTATCAACATTTGTCT
+CGATTTTCTGTTGGGAACATCCATCCCTACCCACAACGTACTGGACCATAATCAAGGGTT
+TGGAACAGTACGCTCCTGTACTCAAGAAGTCCTTGCACGAAAGCAATAGGTTGAACTTCA
+TCATATAGGCGATGACAGTGCTATCAGCCGGACTGGCTGTTCTCGTAGAAGTCACTCGAA
+TCAATAAGATACGAATACTCCATCCTGTACGGGGACACTATATTATGCTAGCCGATTCTG
+TAAATGTAGTCTTTACCGAGAATTGCTGACACTGATTTGAGTGTAGGAGGTCCGGTATAC
+ACTTATCATCAACTTATTCCTACACTCGGTTTTCAATAGTTCGTAGCCCCAGGTTGCATG
+AATATTATACCTCGGATAACACCTACTAATCCGTCCACAGCCTAGCACTTACTGGCGATC
+AATGGAGCATGATGTACTTAGGGGACGGTATGAACATTCTTAACAGTTCCAAATGACCTG
+TAGCAAATACAATAGCATCTTTGTTTAAGCATGGTCCTCTGCGGTTTGAAATGTCGCTAA
+TCTAGTGATATTCCTTGTAAGCCACTGTTACTCTAATTTAGCCCACTCCAGAACGAGTTT
+GTGTCCATGAAAATGTAACTCCCCAGACATGCAAATACGCCTTATTGCTGAATATCGGAA
+CAAACAAAGTCGTTATCATCCTGAAATCGACGACAAGTACATATTAAAGGTTTGTTTGGC
+AAAATAGGTAGCAAGTAGGATGTTCATAACAATTAAAGCGCGTAACTCCTAAATGTGCAT
+TATGCGCCGAGGACCGATAGCTGACGCCGCTCTAGCTTCTATTGTTCCACTGTACGGTAC
+AAAGATTGAATACGGAAACAGAATTCGTCAATTTGTTGAATTATGTTCTATTCGTTTTAT
+CTGGTATATTTGTTACCTAACGTATTTAGGGAAAGTAGCTTCATGAAGAAATCTAATCCC
+TCGCGTGACGAGTTTGCTGTGATTATTATGCGACCTGACTCTTGTAGTGTGGAGTTCGTT
+GTCGTATCTGTACAAACTGCCGACACGTAGACAGGCCTGTCTAATAAACCAGGGACCTTT
+AAGCGTCTTTGTAATTAAGTAAGTACCAGACCATCCTTAGATCAATATGATGCGCAACCG
+GACCGGATCAAATGTTCCAAGCTCGGTAGGTTATCCTATAAGAGCCTCAGCAAAATGATG
+TAAATTGTCAGCGTGTAGTACGGAAACAGATCACGGTATAATCAAGTCTAAATATTTAGC
+CCCGGTCTTGGAATGGCCTTTTATGCAACCAATTTGTGGCGATTAATTTCTCAACAGTAA
+GACAGAGAAAGCTAGAGAAGCTGGTATTATTCTGCATGTTGTCGAACCAGCTGTGTACAG
+TCAACATTTTGCTATTTACTAAGTTGAAGCTTTCGGTTTCATGTGAAATATCTGGCCAAA
+TCGAATGCACCCTTTGACCGGCAGTTTTCATAAGCCACGTGTTTGCATTTCTCTTTAACG
+CATTGAAAATCACCGCGAACGACCTCACAACTGTCTAGCTTACCGATACGTTAGTGGTCT
+CCTCGCAGAATCGAACGAACCCGAATAATATGGTGATATTCTTTAACGACTGATTAGGGT
+CTTATTCGAGATTTTCAGTCTTTAAGCGTGAGCAGCGTGTTAATCACCTAGCAACATTAT
+AGAAAGGAGAAAGGTACGAGCAGTTTAAAAGTTACTTCTAATTTTAACTATTGTCCAACT
+AAGTGTAGATTATTTAGGCTTGTGTCCAAGTGAGATCATACTGTTTTCGTGTGATAGGTA
+TCCGCATCATAACTAGTTATATTAGCACCGTGTATGAAGAAACGGTGGACCGTAGCACAA
+CTCATTGTTATTTTGTCCCCTCTTGGTTTATTGGATCCTAGATTATATACGAATAGAGCC
+CCTTTCGCAACAGCATCAGAATCAGACCTGCGCTCTCGACTGATAATAGCAATTTGTTAA
+GAGCGGATAGACGCAGAAGAATAACATGATTTGTGCACTTAGTCCAGTCCAGATAAGAAG
+TTGAGGCATTGACTTAACTTTTCATTGTCCGCTTGCTATCCCCACGATCCTGCTAAACTA
+AAAGCTTTTGGCGCGGAAGAGCCGTTATGGAGGTTCGGCGAAATTGTATCACTAGCTAGA
+CCATTTTCTGTAGGCTTTTAGCTTGATCGACGTAAATTCGATTCTATATGGTAGAAAGGT
+ACGACCGTTATACGCTCACGTACAGCCTAAATTCACTTGTGGAGGCGATATAAGCTAATA
+AGCGGTTCATTTTGAGGAACCGTTACTTTGAGATTCACTTACAGCAACTAAGGTTGTGTT
+ACCGTTTCTTCTCAATTTACTGCTGGAGCGGCTATTATGCGTCCATCACCTTCATAGCCC
+TAGTCATCAAGCCCATAGAGGTATGTTCGTGTGTAAACGAATTCCAAGACTAATTGGTGG
+AAATTTCAGTTTGGATTGAATGAGGCTGATACTTCTATACACTTAAGGGTTCCCCGTAAG
+TATATTGCCATAAGGGAGTAGTAACACTAAGGTTGTGAAAATATTGCACGACGTAGGTAT
+TCTCAATTTCCTTCTAATTCTGTAGGATTTATGTAAGGCGACCGGGACTCTATTGTTTTG
+TCTCCGAGAGTTTCTTAATCAATTGTCAGGCTAGTAGATCAAGTGTAATAAATGATTAGA
+GGTCCTCATTTGGAGAATTTATCTATATCCTTGGTCGTCCACGCGGTATCGGAGTTGCTA
+TACAATAAGTTGGTTCCAGAAAGCGTCTTAATTACATACTCTTGGTTTATCAACGAGATG
+GTACCTAATACTCTCCTCTCAGTTCAGTAATAAGGACCGTTAACCGCACAATTGCATGTC
+ACCATGTAACACATCCTAGGTTCAGTGGTGCAAACAAATCAAAGTCGTTCGATGTCACTA
+AAACATTTTGCTTAGTAAGCTCACTTGGTTATGCAATATTCTTCACTTCCACAAGTGACT
+CTACTTAAGGCGACGCACCTCCCTACAATTCGCATACGCCAGGTACACACAGCATGGAAT
+AGTGTAGTACCTACTCATGCGCGAACGGTCGCCTGCAGAATTCCAACATGGAGGTCTTCT
+GGCCTAGTGCTTGTGCTTCCGGGATACACCGCACTCATATCACAGTTTTCCCTGGCACAG
+GTTATAGTCCGCTAGCGTGTTGAAGCTAGTTCACCCTTACTATGATCCAAGAAAAGCTTT
+TCGGCCGGCCATCCTTCACCATACGTTTCGGGGTCTTAGTTCATTATCAGAGTCGGTGCC
+ATTGTTCCATGTAGGTACGTGGAGGAAGTAACTCTTGATATGCTATACGTGTAGCATACT
+ATACTCCAGAATCCGTCGCAACAATCCCTTTATCTGCCCCTTTATTTACATTCCCCGCAT
+GTTTTGATTACTTAAATGTCGGGTACTGCTGGTATACACCGTATGCACCGAAAGACAGCA
+ACCCCTCAAAGCTTCGACGAGTTACCTGGTGTGAGACTATCAGCTTATAACCCTTACTAA
+CAGCAGTAGACGAATTCTCCTAGTATAAAGTCAATTACAGTTGACTAAATTCGAAGTAGC
+CGAGTGGGTCTCATTAGACCCTACATGTATCTCTTGTTTTCAAAACGGCTGTGAAAGTCG
+GAATATTATGTGAGTATGATTCACTCGGCGGAACACTCAAACTCGCTGAATCATTGATTC
+GCCGATGATTAAGCCGACCCTCCCAATTACCGCTGCAGCACTACAATCTCAATTTAGGTA
+TACGGATCTAGGTCCGTTCGTTACCAGTTACCAATACGCAACCGAGCTCGAAGAGAACAC
+AAATTTACGAAGCAAAATTCGGAATCAGGGTATCGTGCAGAATGGCAGGAGAGCTGGAAC
+TGTTGTCAGATTTCCCTCTAGTAATCGTACGAGAATATATTCTATGTCACACATTAACCT
+ATAGGTAAAGCCTCATTATACTCCGTTTAATGCAGACTTATAGGATGCCATGCAACAAGT
+CTAATCGTCGCGAGGACACTCAAAAGGATCAGTGGAAAGTAACACTTTGTGGTTCAATTC
+AGAAAATCAGCTTGTTTGTACCTACAAGTACAAAACTTGGAGTGGTAGAGAGGTCAATCG
+ATTAAGTTAAAAGGTTAACGCATGCGCCTAGTCATTAATTGGTTGCTGCGCAAAATAATG
+CATGCGTAGTAAATCCCAGCCCCAAGTCGAATAGATTATTAACGCCGGAAGCAGCCATCT
+GCGGAATCTTCGTTGTGTCGAGCGTCAAACGTTGCTCCATGGCTCCCTCCCTTTATCGGG
+TTCTCTCATTGAGTCCAACTAAACATCTACAAAAGAACTTTGTTATGTGATATAGCTTAG
+GTCTAATCTTAGGCTGACATGCATAACGCTTTGTCGAGGTCTATTAACATAGCCGAATGC
+ATGCAAGCTTTGATGGATATTAACTTCCCAATGTCTAAGATTAAAGAAGAGGACACCCAT
+TATGTCAATCATCTAGCTAAATCGAGCTGCGAGCCGGAGAGTAAACAGTTTCCTTTTCTT
+CGGCGGTTATTTGAAAATTCCTTTCTTATGGCAGTGTTTCGAGCGAGCAGTATATTAGAC
+CCAACCTCGATAATCGTTAATCACATAGCGACTATGATAGTATCATTACCAGCAGCATAC
+ATAAAATTGTAAAGTGTGTTACTGTTTGCGTGGGTGATTATAGTACAGTCTTTTGCAAAT
+CTACGGCCCTGACAGAACTTCACATTAAAGGCCATCCACAGAACAATGGACAACGTATAA
+AACCTAAAAGGATATCGTTTTCCTGGGGTTTTCAGTTGTTTTAATGACCGGTAAATTTTC
+TTACCCTATTGTGTTTCCTTACACAGAAATATCTGAATATTGAGGTACCTGTGAACATTA
+TCATTCATACAACATATCCTATCGCCCATCCTGTGCGGCGACTACTCCAGCACTCACTAA
+TTGTTAATCATCTCATACAACTCGTCAGAATTAACATTACCGCAAACTGCTTACTAGCGC
+AATCAGGTCAAGAGGAGGACGGCTTTGTCACTTAAAAGAATAAGGTGTAGCTGCATAAAA
+CAATGTGTATCTTCTGAGCTTCACAGCCGTGGGCTATCTATGGTTCCGGTCCTGTTGATT
+GCTCCCGATGTTGAACAATACTTTCCACTTTCCGTGACAGAAACTTTAGAGCAAGAGGTC
+AAACTTTACCCAAGCCCATAGGTAGAAGTTACGCGCGCATTGACGTTTGATCAAGGGACA
+GCTGTGAATATCCGTCCCACGTAATCGTGACTTCTCATCAATATTATATTACTGCCGCTA
+ATCAACAACTTCCTTGTTTCGACTGAAACGATTTTAGTCAAGTCGAAGACCTCATACGAT
+AAGATTTGCAACATGTCTAAAAGAGAACGGGAACTGGCAAAAGGCTTGGTAGATCCGTCT
+ATAGCGTAAAACTGATTAACCCATTAGGTCTGAATAACTTTACACAACCCTCCGCACTGT
+TAAATGACGGGCTTTGCTCTGTTTTGACACATCAGCTAGAAACTCGCCACGAAGGCATAA
+GGCTCCCATATAGCGTAGCTGACAAACATATGAGGTGGCTGCATAAACTAAATTGAGGCT
+CGCGTTCGGATACTTGCCCATGTAGCAAGTCTTGGCAACCAACTATATAATCATCACGAA
+TTGAGTGCTAAAGACATGCGAACAGTTGGGGCTGCTATATAGTATGACAGATATAGAAAT
+TTTATAAAATGTCGTAGGAATCTGGAGGCCAAAATCATTAGACACTCTTGTAAAAGGTAT
+GGTAATGTGTATGACCTCTTGGCATAGTGTCCAATTATTCTCGGTTTACTCTCAGAGACA
+CAGTCATGTAAAAGTGGTGAGGAATTACCGCCGTGTTTTGCCAACCAAGAAGCATTGAAC
+AGTAGATCAATAATGATATTCGGTAGCGTATTTACGCTTTGCGGTTTTCAGAAGAAACTA
+TCACAATTGAAACTCTATTCTTCGCCTCATTCCGTACCGTTAGGAATGACTCGAATCGTA
+CTGTCTGCCGCGGGGCATAGTGTATTGCTCCCCACCAGGTTCAGATAGTTCGAATCAGTG
+CGCTGTACAATTGCCTTACGTGTAGATTTGCATCACCGCTTCACGTAGGCACCCAGAGTG
+CTCACTAAAGCCACTAGAGAGATAGAGTTAGAAATTAAGTATCGGTTACGCCCCTCAGAC
+GACATAACTCACTTCTACCGAATATCCTTTCTATCTTGGATACTACTAATGCTTCCGTTC
+ACGCCGCAATCATGTGGATCCTCCAGTAAGCAGGGTGCTGTCATGACTATACAGTACGGA
+TCCGTAAGCATTTTGAGGATGATAACATAGGGTCGGTTACTGTGGATTTCCGTTACTTAG
+GAGAGCAGCTTTAGCTGACTTTGCTGAGGCTGCGCGTGTTAGACAGCAATTTACGAACGG
+CGCACTCTATAGCAGGCACTCACAGTGGACCAGTAGTCCTATTGCAAGAGTTCATTATGG
+AACATTTTAGTCCTCTATCACACGGACCATTGCAGTAGATAACTCTAATCCTATGTCTTT
+ATTTGGTTGCCTGGAACCCCTTACCACTAGACACCCCAATAAGTAATCTTGCTTCCATGT
+CGAATTGATACTCATCGAAAACATATAAAACTAATTATGCTTGTGTTCCTGTGGTCTGTT
+ATATAGAGGCGCCCTATTGGCCGCGGGATAAGGATCATTTTGGCACACTAACGGGATCCT
+AAAACTTTATCTTTCAACGACTCCTACATGCCTTTTAGGTTAGTACGCGAATCGCCTAAC
+AAGCCAATGGGTATTGGAGAATTAGACAAAATGGTTGAGGAATAAAGTGGCGCAGGATTT
+TGTCCGAGAAAGGGATAGCAAACGGTCGCAGGCAGGAGTAACAATTTTCAACCGACCTTA
+ATAGAGCTCAAAAGCTACCGGAGAAAGCTTCGTCTATGCTTAATACATATGCTAACCTAT
+GAATTTCGTAAGCGTAATATAAACTTATCAGATATTTTAAAAGCATCCTATTCAGTCGTA
+CTTTTGGCAGGAAAGGTCAGGCGAAACAGAGTCTCCCTGCGGAGGCTTTTAAAATAAATA
+GCGGGCCTAGCATCGATTCTAAAAGACGACCCCAGGTGCGTAACCGTGCCTCCCCAAGTC
+TTCTTTTAACAATTACCTAGAGAACGGCGTCAGTCGCGAATGACCTTACGAACGTTTACG
+CGGAGCCGAGTAAGATTAATAACTGCTTATTGATTTGCAATCGTTTGATACGGGTGGCCC
+GAAGCTCAATATCAACATAAATAAAATTAGTCGGAATGGTCGCTTAAATCGCGCGCTGTC
+ACTGTCTTCATATGAGGGAGTTGTGTAAGACTGCATTGATATATAGGTATGATTTCGGTT
+TAGAACTTTGTCTGTTAGCAACTCCGCATGATTGAAGGAAATCCTCGTTGGTAAGATCTC
+TTTAGCATTTGCACAGCTGACTCTAACAGCATAGTATGTGATCGTATTATGTCTGCAGTT
+TGTAACACAGTGGGCGGCATGGATGGTACTTAATGGACGTAATGAGCAGTAGACCACCGG
+TGTTACCTAACCATCATTAGAGTAGGCGAGATTGCGCTTGTACGACTTATATATAAGGGT
+AACCGGAATACCGTTCCTCTTATCAACAACAGTTACTGGTCTTAATTCACATCGGATATT
+GCGATCGCCAAGACTATCCCGTAAGTCGTAAGCTAACCAACTAGCGGTTAGGTTTATTGA
+GGTTTTGATGGGAACTTCTCAGACACGTCGTCAACTACCTAATTTCTTGGATGGAGCTAG
+GCTAACTGTCCCAGAACTTTCTGACACTCGAGATCCTCTAACTAATTGGAATCCAGGAAT
+TCCCTTATTGCATCGCCACAAACGACCATAAATTACAGCATGTTTCATTGTCTAACGTGC
+CTATCCACGAAATTGAATTCGGTTCACATTATATATCCCCTTCTACCGCTAATTTAATGT
+TTAACGTTGATGGGGCAAAGCACATTCGAGAAGTACCGAAAAGTCTCAATCCAAAGACCG
+GAGGAACTGGCTTCGGTAAGAATCGCGAGTATCCTTGGATGCCCTGCCTGATTATAACTT
+GTTCCATGTAGATAGGCGTAGCTAATTCATAGCAATACAATAAACGAGTCAGAACTGTAG
+TCTAACATAACAGCCTGCTCTCCAGGTAACAGCCCATTATTAGATATAGTATCACGATCG
+TCGGTTGTATTAGTGGTGATAACTATCGATTCTGCCACTAATAGAATGTGCAGAAATAAA
+GTATCTGAAAGAAAACGAAGTCACAGAGAATAAAGCTCACTTCATAAAAGTCGGTTGCAG
+TAGACGCATATCAATTTTCCCTGCTGCATTTTAGAGTTCGGAATAGTTAAACATAATACT
+GGAAGCGCTTCCGGCAATCAGGAATAACCCCATATAAACCAACCTTTGTTGCTATTGCCA
+GCGCTATTCTCGTCAAAATTTCTCCCTATGGTCTTCACATCATGCATCACCGGACCCTTT
+GATAGACGATGACCCAATTACAATCACTCCACGGATGAGCATCCCATTTTATACGAGGCC
+CACTGGAAACAATTGCAATCGACGTGACCAAGTAGAGGAGCGTGCTCGAAAGGTGATGAT
+TGCCGAATTCTAACAAGGATACTATAAGCCACGGAACGCTGACGTTGAACAGACCTGGTC
+TCCTGGGCACTTCGCAGCACCTCAGTAGTAATTCCGGTAGATTAGGACTTAGCATTCCGT
+TGATCTTACAGGATTTATAAATAAGGAGATCTGTCTTGTTTAATTAGGAGGACGCTTTTC
+CCGCGTAAGTACGGGAAAACGTTCTTCTGATTTTGTTTGCCACTTGACATTGTAGCTGCT
+AGGAGAAGGGATAATATCCGCGTTTTCTTTTACCGTAACGTCGGAGCATACCATGGTAAT
+TGTCCGTGTCAAAACTAGATATCTAGGTTGCAAAATTCAGTCAGTAAGTCCTGAGGCCTT
+CCGCATTATTAATTCTACAGACATATGAATTTGCTCCACCGGCTAGCACAGTCAACTCAA
+CCCACGATAGGGGAACGAAATCACAAATAGGTTCACATGGTCAATACAAGGCAAACCATT
+CCCCATAACTCACGCACTGACGGTAAGGCCATTTCAGGTCAAGCGGTGAATGCTGTGAAA
+AGCAGCTCGACCACCTGCCGTGGATGGCAAACCGATAACAAAGGACTCCGATACTTCATT
+TGTAAACGTTTGCAGTGCTGACGTAACTCATATCTACAGTCAAACCGAATGGTTTGATCG
+GCATTATGTAAAGGAATCGACACACGTTGCGTCTTCTAGATTATTACACACCTGTCTGCG
+ACGGATATAGGTAAATAAGTCAGCCTCCACTCTGCAGAAGATACTAGAAACGTATCAGTA
+ATAGCTATCAGGATTTCGCCATCCTCGCACTGTGCCCGGATATCACAGCAAGATTCTAGG
+ATGGCACTTGTGTGACTAGAGGTTTTACTCGTTGAGCCATTCTTACTATAGGCATGGGAT
+TACAATGTGCATGTTTGTGATGTTATCCCATATCTTGCATGTATCAGCCTACCAATTAGA
+CATATGACTAGATGTAGTCGATCAACGCAAGGGTGCGGACTTTGATTCCTTTTGAATTGA
+AGTCAACTCAGATGCTCCTTAAGACGTTTTACAGTAGGTATTTTGTGGTACAAACCAGAA
+CCAGTGCCAGTCGGTAGTTATTGTAGTGTGTTCTTAATACATATTTGGTATTGGAGTTTC
+TAACATTTAAAAGGAGCCTATTACACTTACTTAATTTGCGTCTATATTTCTGTTACGATA
+TGTCGTCTGTCGATTTTACGAGTTTCATACGTGCGGGTTCCCTGTTCGCAATGGGCCCCT
+TGCTAATGTCCCGCATCTTTAGGATGCAAACTTACTCACGCCTCCTTTACCGAGACTTGG
+TGGGAGAGAAGACTCCTGTAGAATCCCGATCTGAATGGTTTCAGTGTAAGGGTCCCTTCT
+AGCCATATCATTGAATATTCTTGTACTTTAAGTAACTCGATCCTACCAGTACAATTCTAG
+GTTTGCCTTATAGCCGGAATGAGTATCAGCGTCATTCACCCCGGCCGGATATTATTTGCA
+ATGTCAGGGACACCCAAAATAGACCGGTTAGAAGGCATATGCGATGAGAGTTGGTGCCTA
+AATTAAACGATACAATTGATATGACAAGGACTATACGATGAAATCCATGAGATAATTATC
+GTAACTCGGCCAACCTAAAACCGTGCAAGATAGGAGCGGTCCTAGAAGTACTATCGACAC
+CTTAAATACTCACTTGAGTTTTCCGATCCTATAGTGCCAATCATATGGCGCAGGAATATT
+ACAAACTAAGAAAGTCAACAAAAGATGTAAATTGCAACACCTGGCATCGGTGGGGTTGTC
+CCCTTAAACCCTGAAACCAACTGTTATGCTCAACATTATATCGAGGCTAAAACGCGTATC
+GTGGCACATTAATAACGATCACATAAGCTTTGCGGCTAGCAATAATAATTTAGGACAGCT
+TAGATTTTGACCCGTGCTAATCCTCAGTATGGAGTAATTTTACGGATCTCTCGTTGTAAC
+CGTCCTCAGTCGTGTACATTTTAACCTTTGTAAACTAGTTTACGAACGAGTATTTAGAAG
+GTCCGTACTCTCACCCAACTGACACATTGTACTAGCTCAAGATCGCAAACACTAAGGGTG
+TGAGTCGCGGGATAGCGCTTAAATATGACTGCTAATGGTCAAGAGCACGCGCATAATATT
+CCACTGGTTCTAGGTCACCACTACGGTCAGACGTTGACCTGCATGCCCTACATCCGGCAC
+GGGCTACTAACGGCCTAATATTCTTTGAGCCATATCCATACTCGTCTATGCATATTCAGG
+TATACGGCTATAGTGCGTTATTAACTTCGTCGTGATTAAATCCTTTAATTGTTCCATTAT
+AAGTATACATGCTTAGATGCGTGAACTTGAGGGATATCGTTGCTCTAAAGTTGTCTTATA
+GACTAAATCTAAACAAGCCGTGCAAGACTACTTAAATTACAAATCTTACAGACATCTCGC
+CACTGCGCTAACACTAACAA
diff --git a/pipelines/nf-atacseq/tests/data/chr_test.fa.fai b/pipelines/nf-atacseq/tests/data/chr_test.fa.fai
deleted file mode 120000
index 8158c3c..0000000
--- a/pipelines/nf-atacseq/tests/data/chr_test.fa.fai
+++ /dev/null
@@ -1 +0,0 @@
-../../../../tests/shared_data/chr_test.fa.fai
\ No newline at end of file
diff --git a/pipelines/nf-atacseq/tests/data/chr_test.fa.fai b/pipelines/nf-atacseq/tests/data/chr_test.fa.fai
new file mode 100644
index 0000000..4e99d5b
--- /dev/null
+++ b/pipelines/nf-atacseq/tests/data/chr_test.fa.fai
@@ -0,0 +1 @@
+chr_test 20000 10 60 61
diff --git a/pipelines/nf-atacseq/tests/data/generate_realistic_reference.py b/pipelines/nf-atacseq/tests/data/generate_realistic_reference.py
new file mode 100644
index 0000000..cb9d937
--- /dev/null
+++ b/pipelines/nf-atacseq/tests/data/generate_realistic_reference.py
@@ -0,0 +1,123 @@
+#!/usr/bin/env python3
+"""
+Generate a realistic ~20kb non-repetitive reference sequence for ATAC-seq testing.
+
+Properties:
+ - ~42% GC content (human-like)
+ - No homopolymer runs > 5bp
+ - High k-mer uniqueness (>99% unique 20-mers)
+ - Deterministic (seeded RNG)
+
+Output: chr_test.fa with contig name 'chr_test'
+"""
+
+import random
+import sys
+
+SEED = 42
+LENGTH = 20000
+CONTIG = "chr_test"
+LINE_WIDTH = 60
+MAX_HOMOPOLYMER = 5
+
+# Target base frequencies for ~42% GC
+# A=29%, T=29%, G=21%, C=21%
+BASES = "ATGC"
+WEIGHTS = [0.29, 0.29, 0.21, 0.21]
+
+
+def generate_sequence(length, seed=SEED):
+ """Generate a non-repetitive sequence with controlled GC content."""
+ rng = random.Random(seed)
+
+ seq = []
+ homopolymer_count = 0
+ last_base = None
+
+ for _ in range(length):
+ # Pick a base using weighted random
+ base = rng.choices(BASES, weights=WEIGHTS, k=1)[0]
+
+ # Prevent long homopolymers
+ if base == last_base:
+ homopolymer_count += 1
+ if homopolymer_count >= MAX_HOMOPOLYMER:
+ # Force a different base
+ alternatives = [b for b in BASES if b != base]
+ alt_weights = [WEIGHTS[BASES.index(b)] for b in alternatives]
+ total = sum(alt_weights)
+ alt_weights = [w / total for w in alt_weights]
+ base = rng.choices(alternatives, weights=alt_weights, k=1)[0]
+ homopolymer_count = 1
+ else:
+ homopolymer_count = 1
+
+ seq.append(base)
+ last_base = base
+
+ return "".join(seq)
+
+
+def validate_sequence(seq):
+ """Validate sequence properties."""
+ gc = sum(1 for b in seq if b in "GC") / len(seq)
+
+ # Check k-mer uniqueness
+ kmers_20 = set()
+ for i in range(len(seq) - 19):
+ kmers_20.add(seq[i : i + 20])
+ unique_20 = len(kmers_20)
+ total_20 = len(seq) - 19
+ uniqueness = unique_20 / total_20
+
+ # Check max homopolymer
+ max_hp = 1
+ current_hp = 1
+ for i in range(1, len(seq)):
+ if seq[i] == seq[i - 1]:
+ current_hp += 1
+ max_hp = max(max_hp, current_hp)
+ else:
+ current_hp = 1
+
+ return {
+ "length": len(seq),
+ "gc_content": gc,
+ "unique_20mers": unique_20,
+ "total_20mers": total_20,
+ "uniqueness_pct": uniqueness * 100,
+ "max_homopolymer": max_hp,
+ }
+
+
+def write_fasta(seq, contig, filepath, line_width=LINE_WIDTH):
+ """Write sequence as FASTA."""
+ with open(filepath, "w") as f:
+ f.write(f">{contig}\n")
+ for i in range(0, len(seq), line_width):
+ f.write(seq[i : i + line_width] + "\n")
+
+
+def main():
+ output = sys.argv[1] if len(sys.argv) > 1 else "chr_test.fa"
+
+ print(f"Generating {LENGTH}bp non-repetitive reference sequence...")
+ seq = generate_sequence(LENGTH)
+
+ stats = validate_sequence(seq)
+ print(f" Length: {stats['length']}bp")
+ print(f" GC content: {stats['gc_content']:.1%}")
+ print(f" Unique 20-mers: {stats['unique_20mers']}/{stats['total_20mers']} ({stats['uniqueness_pct']:.1f}%)")
+ print(f" Max homopolymer: {stats['max_homopolymer']}bp")
+
+ # Validate
+ assert stats["gc_content"] > 0.38 and stats["gc_content"] < 0.46, f"GC content out of range: {stats['gc_content']}"
+ assert stats["uniqueness_pct"] > 99.0, f"Uniqueness too low: {stats['uniqueness_pct']}"
+ assert stats["max_homopolymer"] <= MAX_HOMOPOLYMER, f"Homopolymer too long: {stats['max_homopolymer']}"
+
+ write_fasta(seq, CONTIG, output)
+ print(f" Wrote {output}")
+
+
+if __name__ == "__main__":
+ main()
diff --git a/pipelines/nf-atacseq/tests/data/generate_test_data.sh b/pipelines/nf-atacseq/tests/data/generate_test_data.sh
index f5cb288..9cb2eb4 100755
--- a/pipelines/nf-atacseq/tests/data/generate_test_data.sh
+++ b/pipelines/nf-atacseq/tests/data/generate_test_data.sh
@@ -1,11 +1,18 @@
#!/bin/bash
# =============================================================================
-# WASP2 nf-atacseq Test Data Generator
+# WASP2 nf-atacseq Test Data Generator (v2 — realistic reference)
# =============================================================================
-# Creates ATAC-seq-like test data by symlinking shared core data and generating
-# pipeline-specific files (shorter fragment FASTQs, BWA index, samplesheet).
+# Generates self-contained ATAC-seq test data with a non-repetitive reference
+# so BWA alignment produces meaningful mapping rates (>80%).
#
-# Prerequisites: samtools, bgzip, tabix, wgsim, bwa (WASP2_dev2 conda env)
+# Previous version used the shared chr_test.fa which is a repetitive ATGC
+# pattern yielding ~0% mapping. This version generates its own reference.
+#
+# To produce non-zero allele counts, reads are simulated from BOTH haplotypes:
+# half from the REF haplotype, half from an ALT haplotype with het SNPs applied.
+#
+# Prerequisites: python3, samtools, bgzip, tabix, wgsim, bwa
+# (all available in WASP2_dev2 conda env or WASP2 micromamba env)
#
# Usage:
# cd pipelines/nf-atacseq/tests/data
@@ -17,106 +24,307 @@ set -euo pipefail
SCRIPT_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)"
cd "$SCRIPT_DIR"
-SHARED_DATA="../../../../tests/shared_data"
+# BWA may not be in PATH; check common conda/micromamba locations
+if ! command -v bwa &>/dev/null; then
+ for candidate in \
+ /usr/local/Cellar/micromamba/*/envs/WASP2/bin/bwa \
+ /usr/local/Cellar/micromamba/*/envs/WASP2_dev2/bin/bwa \
+ "${HOME}/miniforge3/envs/WASP2/bin/bwa" \
+ "${HOME}/miniconda3/envs/WASP2/bin/bwa"; do
+ if [[ -x "$candidate" ]]; then
+ export PATH="$(dirname "$candidate"):$PATH"
+ break
+ fi
+ done
+fi
echo "==================================================================="
-echo " WASP2 nf-atacseq Test Data Generator"
+echo " WASP2 nf-atacseq Test Data Generator (v2)"
echo "==================================================================="
-# Validate shared core data exists
-if [[ ! -f "$SHARED_DATA/chr_test.fa" ]]; then
- echo "ERROR: Shared core data not found at $SHARED_DATA"
- echo " Run: cd tests/shared_data && bash generate_core_data.sh"
- exit 1
-fi
-
# -----------------------------------------------------------------------------
-# Symlink shared reference and variants
+# Check prerequisites
# -----------------------------------------------------------------------------
-echo "[1/4] Symlinking shared reference data..."
+echo "[0/7] Checking prerequisites..."
+
+check_tool() {
+ if ! command -v "$1" &>/dev/null; then
+ echo "ERROR: $1 is required but not found in PATH"
+ echo " Try: conda activate WASP2_dev2"
+ exit 1
+ fi
+ echo " OK: $1"
+}
+
+check_tool python3
+check_tool samtools
+check_tool bwa
+check_tool wgsim
+check_tool bgzip
+check_tool tabix
+echo ""
+# -----------------------------------------------------------------------------
+# Clean stale symlinks and old data (one-time migration from v1)
+# -----------------------------------------------------------------------------
+echo "[1/7] Cleaning stale data..."
for f in chr_test.fa chr_test.fa.fai variants.vcf.gz variants.vcf.gz.tbi annotation.gtf regions.bed; do
- if [[ ! -e "$f" ]]; then
- ln -sf "$SHARED_DATA/$f" "$f"
- echo " ✓ Linked $f"
- else
- echo " - $f already exists"
+ if [[ -L "$f" ]]; then
+ rm -f "$f"
+ echo " Removed symlink: $f"
fi
done
+rm -rf bwa_index
+rm -f sample1_R1.fq.gz sample1_R2.fq.gz
+rm -f chr_test.fa chr_test.fa.fai variants.vcf variants.vcf.gz variants.vcf.gz.tbi regions.bed
+echo " Cleaned previous outputs"
+echo ""
+
+# -----------------------------------------------------------------------------
+# Generate realistic non-repetitive reference
+# -----------------------------------------------------------------------------
+echo "[2/7] Generating realistic reference genome..."
+python3 "${SCRIPT_DIR}/generate_realistic_reference.py" chr_test.fa
+samtools faidx chr_test.fa
+echo " Created chr_test.fa + .fai"
+echo ""
+# -----------------------------------------------------------------------------
+# Generate VCF with ~30 het SNPs + ALT haplotype reference
+# -----------------------------------------------------------------------------
+echo "[3/7] Creating VCF with 30 het SNPs and ALT haplotype..."
+
+python3 - <<'PYEOF'
+import random
+
+# Read reference
+with open("chr_test.fa") as f:
+ lines = f.readlines()
+seq = "".join(l.strip() for l in lines[1:])
+
+# Deterministic SNP positions spread across the reference
+rng = random.Random(99)
+positions = sorted(rng.sample(range(200, 19800), 30))
+
+# Transition mapping for plausible variants
+transitions = {"A": "G", "G": "A", "T": "C", "C": "T"}
+
+# --- Write VCF ---
+vcf_lines = []
+vcf_lines.append("##fileformat=VCFv4.2")
+vcf_lines.append("##source=WASP2_nf_atacseq_test_data_v2")
+vcf_lines.append("##reference=chr_test.fa")
+vcf_lines.append("##contig=