diff --git a/docs/_static/preprocess_rulegraph_no_qc.svg b/docs/_static/preprocess_no_qc_rulegraph.svg
similarity index 65%
rename from docs/_static/preprocess_rulegraph_no_qc.svg
rename to docs/_static/preprocess_no_qc_rulegraph.svg
index 6ddf980d..c631689f 100644
--- a/docs/_static/preprocess_rulegraph_no_qc.svg
+++ b/docs/_static/preprocess_no_qc_rulegraph.svg
[SVG hunks omitted: the Graphviz markup was stripped during extraction. The only visible label change renames the rule node "preprocess_no_qc" to "preprocess"; the remaining nodes (all, combine_genotypes, add_variant_ids, concatenate_variants, create_parquet_variant_ids, variants, normalize, sparsify, extract_samples, index_fasta) and their edges are unchanged.]
diff --git a/docs/_static/preprocess_rulegraph_with_qc.svg b/docs/_static/preprocess_with_qc_rulegraph.svg
similarity index 61%
rename from docs/_static/preprocess_rulegraph_with_qc.svg
rename to docs/_static/preprocess_with_qc_rulegraph.svg
index 167d7839..24d6061c 100644
--- a/docs/_static/preprocess_rulegraph_with_qc.svg
+++ b/docs/_static/preprocess_with_qc_rulegraph.svg
[SVG hunks omitted: same relabelling, "preprocess_with_qc" to "preprocess". This graph additionally contains the qc_varmiss, qc_hwe, qc_read_depth, qc_allelic_imbalance, qc_indmiss and process_individual_missingness nodes, which are unchanged.]
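The two rulegraph images are renamed so the file names follow the `*_rulegraph.svg` pattern, and their `preprocess_no_qc` / `preprocess_with_qc` nodes are relabelled to `preprocess` to match the renamed rule in the snakefiles below. Graphs like these are normally generated from the pipelines rather than edited by hand; as a sketch only, a hypothetical docs-maintenance rule (not part of this PR) could rebuild both files, assuming `snakemake` and Graphviz's `dot` are on the PATH and the pipelines parse without additional `--configfile` arguments:

```python
# Hypothetical helper rule, not in this PR: regenerate both rulegraph SVGs
# directly from the pipeline definitions.
rule preprocess_rulegraphs:
    output:
        no_qc="docs/_static/preprocess_no_qc_rulegraph.svg",
        with_qc="docs/_static/preprocess_with_qc_rulegraph.svg",
    shell:
        "snakemake --snakefile pipelines/preprocess_no_qc.snakefile --rulegraph"
        " | dot -Tsvg > {output.no_qc} && "
        "snakemake --snakefile pipelines/preprocess_with_qc.snakefile --rulegraph"
        " | dot -Tsvg > {output.with_qc}"
```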
diff --git a/docs/preprocessing.md b/docs/preprocessing.md
index b9564cf1..c9c3bc79 100644
--- a/docs/preprocessing.md
+++ b/docs/preprocessing.md
@@ -3,7 +3,7 @@
 The DeepRVAT preprocessing pipeline is based on [snakemake](https://snakemake.readthedocs.io/en/stable/); it uses
 [bcftools + samtools](https://www.htslib.org/) and a [python script](https://github.com/PMBio/deeprvat/blob/main/deeprvat/preprocessing/preprocess.py), preprocess.py.
 
-![DeepRVAT preprocessing pipeline](_static/preprocess_rulegraph_no_qc.svg)
+![DeepRVAT preprocessing pipeline](_static/preprocess_no_qc_rulegraph.svg)
 
 ## Output
 
@@ -126,7 +126,7 @@
 we used when we wrote the paper. The qc is specific to the UKBB data, so if you are not working with UKBB data you can run the
 pipeline without qc.
 
 ### Run the preprocess pipeline with example data and qc
-![DeepRVAT preprocessing pipeline](_static/preprocess_rulegraph_with_qc.svg)
+![DeepRVAT preprocessing pipeline](_static/preprocess_with_qc_rulegraph.svg)
 
 *The vcf files in the example data folder were generated using [fake-vcf](https://github.com/endast/fake-vcf) (with some manual editing).
@@ -170,7 +170,7 @@ total 48
 
 ### Run the preprocess pipeline with example data and no qc
 
-![DeepRVAT preprocessing pipeline](_static/preprocess_rulegraph_no_qc.svg)
+![DeepRVAT preprocessing pipeline](_static/preprocess_no_qc_rulegraph.svg)
 
 *The vcf files in the example data folder were generated using [fake-vcf](https://github.com/endast/fake-vcf) (with some manual editing).
diff --git a/pipelines/preprocess_no_qc.snakefile b/pipelines/preprocess_no_qc.snakefile
index 4675972f..43cd58c8 100644
--- a/pipelines/preprocess_no_qc.snakefile
+++ b/pipelines/preprocess_no_qc.snakefile
@@ -3,17 +3,17 @@ include: "preprocessing/preprocess.snakefile"
 
 rule all:
     input:
-        preprocessed_dir / "genotypes.h5",
-        norm_variants_dir / "variants.tsv.gz",
-        variants=norm_variants_dir / "variants.parquet",
+        combined_genotypes=rules.combine_genotypes.output,
+        variants_tsv=rules.add_variant_ids.output.variants,
+        variants_parquet=rules.create_parquet_variant_ids.output.variants,
 
 
-rule preprocess_no_qc:
+rule preprocess:
     input:
-        variants=norm_variants_dir / "variants.tsv.gz",
-        variants_parquet=norm_variants_dir / "variants.parquet",
-        samples=norm_dir / "samples_chr.csv",
-        sparse_tg=expand(sparse_dir / "{vcf_stem}.tsv.gz", vcf_stem=vcf_stems),
+        variants=rules.add_variant_ids.output.variants,
+        variants_parquet=rules.create_parquet_variant_ids.output.variants,
+        samples=rules.extract_samples.output,
+        sparse_tg=expand(rules.sparsify.output.tsv, vcf_stem=vcf_stems),
     output:
         expand(preprocessed_dir / "genotypes_chr{chr}.h5", chr=chromosomes),
     shell:
         " ".join(
             [
@@ -27,6 +27,6 @@ rule preprocess_no_qc:
                 "{input.variants_parquet}",
                 "{input.samples}",
                 f"{sparse_dir}",
-                f"{preprocessed_dir / 'genotypes'}",
+                f"{preprocessed_dir/ 'genotypes'}",
             ]
         )
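The recurring change in both pipeline snakefiles is the same: instead of repeating path expressions such as `norm_variants_dir / "variants.tsv.gz"`, downstream rules now reference the producing rule through Snakemake's `rules` object (`rules.add_variant_ids.output.variants`, `expand(rules.sparsify.output.tsv, vcf_stem=vcf_stems)`, ...), so each path is defined in exactly one place. A minimal, self-contained sketch of the pattern, with hypothetical directories and placeholder shell commands rather than the real pipeline:

```python
# Sketch of the rules.<name>.output pattern; directories, wildcard values and
# shell commands are placeholders, not the real DeepRVAT commands.
from pathlib import Path

sparse_dir = Path("example/sparse")
preprocessed_dir = Path("example/preprocessed")
vcf_stems = ["chr21", "chr22"]


rule sparsify:
    input:
        bcf="example/norm/{vcf_stem}.bcf",
    output:
        tsv=sparse_dir / "{vcf_stem}.tsv.gz",
    shell:
        "touch {output.tsv}"  # stand-in for the real sparsify command


rule preprocess:
    input:
        # the same files as before, but addressed through the producing rule,
        # so a renamed or relocated output only has to be changed once
        sparse_tg=expand(rules.sparsify.output.tsv, vcf_stem=vcf_stems),
    output:
        preprocessed_dir / "genotypes.h5",
    shell:
        "touch {output}"  # stand-in for the real preprocess command
```

Requesting the final target (e.g. `snakemake -c1 example/preprocessed/genotypes.h5`) then pulls in the `sparsify` jobs through the expanded references, just as the renamed `preprocess` rule does above.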
diff --git a/pipelines/preprocess_with_qc.snakefile b/pipelines/preprocess_with_qc.snakefile
index 70b778bb..630c85a1 100644
--- a/pipelines/preprocess_with_qc.snakefile
+++ b/pipelines/preprocess_with_qc.snakefile
@@ -4,28 +4,26 @@ include: "preprocessing/qc.snakefile"
 
 rule all:
     input:
-        preprocessed_dir / "genotypes.h5",
-        norm_variants_dir / "variants.tsv.gz",
-        variants=norm_variants_dir / "variants.parquet",
+        combined_genotypes=rules.combine_genotypes.output,
+        variants_tsv=rules.add_variant_ids.output.variants,
+        variants_parquet=rules.create_parquet_variant_ids.output.variants,
 
 
-rule preprocess_with_qc:
+rule preprocess:
     input:
-        variants=norm_variants_dir / "variants.tsv.gz",
-        variants_parquet=norm_variants_dir / "variants.parquet",
-        samples=norm_dir / "samples_chr.csv",
-        sparse_tg=expand(sparse_dir / "{vcf_stem}.tsv.gz",vcf_stem=vcf_stems),
-        qc_varmiss=expand(qc_varmiss_dir / "{vcf_stem}.tsv.gz",vcf_stem=vcf_stems),
-        qc_hwe=expand(qc_hwe_dir / "{vcf_stem}.tsv.gz",vcf_stem=vcf_stems),
-        qc_read_depth=expand(
-            qc_read_depth_dir / "{vcf_stem}.tsv.gz",vcf_stem=vcf_stems
-        ),
+        variants=rules.add_variant_ids.output.variants,
+        variants_parquet=rules.create_parquet_variant_ids.output.variants,
+        samples=rules.extract_samples.output,
+        sparse_tg=expand(rules.sparsify.output.tsv, vcf_stem=vcf_stems),
+        qc_varmiss=expand(rules.qc_varmiss.output, vcf_stem=vcf_stems),
+        qc_hwe=expand(rules.qc_hwe.output, vcf_stem=vcf_stems),
+        qc_read_depth=expand(rules.qc_read_depth.output, vcf_stem=vcf_stems),
         qc_allelic_imbalance=expand(
-            qc_allelic_imbalance_dir / "{vcf_stem}.tsv.gz",vcf_stem=vcf_stems
+            rules.qc_allelic_imbalance.output, vcf_stem=vcf_stems
         ),
-        qc_indmiss_samples=qc_filtered_samples_dir / "indmiss_samples.csv",
+        qc_indmiss_samples=rules.process_individual_missingness.output,
     output:
-        expand(preprocessed_dir / "genotypes_chr{chr}.h5",chr=chromosomes),
+        expand(preprocessed_dir / "genotypes_chr{chr}.h5", chr=chromosomes),
     shell:
         " ".join(
             [
@@ -42,6 +40,6 @@
                 "{input.variants_parquet}",
                 "{input.samples}",
                 f"{sparse_dir}",
-                f"{preprocessed_dir / 'genotypes'}",
+                f"{preprocessed_dir/ 'genotypes'}",
             ]
         )
diff --git a/pipelines/preprocessing/preprocess.snakefile b/pipelines/preprocessing/preprocess.snakefile
index cad20b3c..69edc18d 100644
--- a/pipelines/preprocessing/preprocess.snakefile
+++ b/pipelines/preprocessing/preprocess.snakefile
@@ -50,10 +50,17 @@ rule combine_genotypes:
     shell:
         f"{preprocessing_cmd} combine-genotypes {{input}} {{output}}"
 
+
+rule extract_samples:
+    input:
+        vcf_files,
+    output:
+        norm_dir / "samples_chr.csv",
+    shell:
+        f"{load_bcftools} bcftools query --list-samples {{input}} > {{output}}"
 
 rule normalize:
     input:
-        samplefile=norm_dir / "samples_chr.csv",
+        samplefile=rules.extract_samples.output,
         fasta=fasta_file,
         fastaindex=fasta_index_file,
     params:
@@ -77,7 +84,7 @@ rule index_fasta:
 
 rule sparsify:
     input:
-        bcf=bcf_dir / "{vcf_stem}.bcf",
+        bcf=rules.normalize.output.bcf_file,
     output:
         tsv=sparse_dir / "{vcf_stem}.tsv.gz",
     resources:
@@ -89,7 +96,7 @@
 
 rule variants:
     input:
-        bcf=bcf_dir / "{vcf_stem}.bcf",
+        bcf=rules.normalize.output.bcf_file,
     output:
         norm_variants_dir / "{vcf_stem}.tsv.gz",
     resources:
@@ -100,7 +107,7 @@
 
 rule concatenate_variants:
     input:
-        expand(norm_variants_dir / "{vcf_stem}.tsv.gz",vcf_stem=vcf_stems),
+        expand(rules.variants.output, vcf_stem=vcf_stems),
     output:
         norm_variants_dir / "variants_no_id.tsv.gz",
     resources:
@@ -111,7 +118,7 @@
 
 rule add_variant_ids:
     input:
-        norm_variants_dir / "variants_no_id.tsv.gz",
+        rules.concatenate_variants.output,
     output:
         variants=norm_variants_dir / "variants.tsv.gz",
         duplicates=qc_duplicate_vars_dir / "duplicates.tsv",
@@ -123,7 +130,7 @@
 
 rule create_parquet_variant_ids:
     input:
-        norm_variants_dir / "variants_no_id.tsv.gz",
+        rules.concatenate_variants.output,
     output:
         variants=norm_variants_dir / "variants.parquet",
         duplicates=qc_duplicate_vars_dir / "duplicates.parquet",
@@ -131,13 +138,3 @@
         mem_mb=2048,
     shell:
         f"{preprocessing_cmd} add-variant-ids {{input}} {{output.variants}} {{output.duplicates}}"
-
-
-rule extract_samples:
-    input:
-        vcf_files,
-    output:
-        norm_dir / "samples_chr.csv",
-    shell:
-        f"{load_bcftools} bcftools query --list-samples {{input}} > {{output}}"
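A side effect of this style, and apparently the reason `extract_samples` moves from the bottom of `preprocess.snakefile` to just above `normalize`: Snakemake resolves `rules.<name>` while it parses the workflow, so a rule can only be referenced by rules defined later in the file. A minimal sketch using the same two rule names but placeholder paths and commands:

```python
# Sketch only: real rule names from this PR, placeholder paths and commands.
rule extract_samples:
    output:
        "norm/samples_chr.csv",
    shell:
        "touch {output}"  # stand-in for `bcftools query --list-samples`


rule normalize:
    input:
        # valid because extract_samples is already defined above this rule;
        # with the order reversed, parsing would fail on `rules.extract_samples`
        samplefile=rules.extract_samples.output,
    output:
        bcf_file="norm/{vcf_stem}.bcf",
    shell:
        "touch {output.bcf_file}"  # stand-in for the real normalization command
```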