Compare commits

..

No commits in common. "4043a8a72bba54200f6f512e8b91d18d00e891c8" and "30807f2bd00ba1950d142aced92fa9e91c06e342" have entirely different histories.

4 changed files with 145 additions and 277 deletions

View File

@ -6,12 +6,12 @@
id="Layer_1" id="Layer_1"
x="0px" x="0px"
y="0px" y="0px"
width="211.93124mm" width="210mm"
height="111.38958mm" height="297mm"
viewBox="0 0 800.99999 420.99999" viewBox="0 0 793.7008 1122.5197"
enable-background="new 0 0 576 360" enable-background="new 0 0 576 360"
xml:space="preserve" xml:space="preserve"
sodipodi:docname="Evolution_fate_duplicate_genes.svg" sodipodi:docname="Evolution_fate_duplicate_genes_-_vector.svg"
inkscape:version="1.2.2 (b0a8486541, 2022-12-01)" inkscape:version="1.2.2 (b0a8486541, 2022-12-01)"
inkscape:export-filename="Evolution_fate_duplicate_genes.pdf" inkscape:export-filename="Evolution_fate_duplicate_genes.pdf"
inkscape:export-xdpi="96" inkscape:export-xdpi="96"
@ -152,23 +152,23 @@
inkscape:pagecheckerboard="0" inkscape:pagecheckerboard="0"
inkscape:deskcolor="#d1d1d1" inkscape:deskcolor="#d1d1d1"
showgrid="true" showgrid="true"
inkscape:zoom="0.5659722" inkscape:zoom="1.1319444"
inkscape:cx="295.0675" inkscape:cx="468.22086"
inkscape:cy="190.82209" inkscape:cy="138.69939"
inkscape:window-width="1280" inkscape:window-width="1920"
inkscape:window-height="995" inkscape:window-height="1007"
inkscape:window-x="1920" inkscape:window-x="0"
inkscape:window-y="0" inkscape:window-y="0"
inkscape:window-maximized="1" inkscape:window-maximized="1"
inkscape:current-layer="Layer_1" inkscape:current-layer="Layer_1"
inkscape:document-units="mm"><inkscape:grid inkscape:document-units="mm"><inkscape:grid
type="xygrid" type="xygrid"
id="grid2647" id="grid2647"
originx="0.49999999" originx="0"
originy="0.49999998" /></sodipodi:namedview> originy="0" /></sodipodi:namedview>
<g <g
id="g67" id="g67"
transform="translate(106.977,32.725)"> transform="translate(106.477,32.225)">
<linearGradient <linearGradient
id="SVGID_1_" id="SVGID_1_"
gradientUnits="userSpaceOnUse" gradientUnits="userSpaceOnUse"
@ -280,7 +280,7 @@
<g <g
id="g34"> id="g34">
<polygon <polygon
points="235.433,18.441 232.954,14.174 243.4,18.441 232.954,22.71 " points="243.4,18.441 232.954,22.71 235.433,18.441 232.954,14.174 "
id="polygon32" /> id="polygon32" />
</g> </g>
</g> </g>
@ -605,7 +605,7 @@
</g> </g>
<g <g
id="g134" id="g134"
transform="translate(106.977,32.725)"> transform="translate(106.477,32.225)">
<linearGradient <linearGradient
id="SVGID_5_" id="SVGID_5_"
gradientUnits="userSpaceOnUse" gradientUnits="userSpaceOnUse"
@ -717,7 +717,7 @@
<g <g
id="g101"> id="g101">
<polygon <polygon
points="235.433,109.107 232.954,104.84 243.4,109.107 232.954,113.377 " points="243.4,109.107 232.954,113.377 235.433,109.107 232.954,104.84 "
id="polygon99" /> id="polygon99" />
</g> </g>
</g> </g>
@ -1041,8 +1041,8 @@
</g> </g>
</g> </g>
<rect <rect
x="488.81104" x="488.31104"
y="44.583" y="44.083"
fill="none" fill="none"
width="191" width="191"
height="31.433001" height="31.433001"
@ -1050,23 +1050,23 @@
<text <text
id="text142" id="text142"
style="font-style:normal;font-variant:normal;font-weight:normal;font-stretch:normal;font-size:16px;font-family:'TeX Gyre Termes';-inkscape-font-specification:'TeX Gyre Termes, Normal';font-variant-ligatures:normal;font-variant-caps:normal;font-variant-numeric:normal;font-variant-east-asian:normal" style="font-style:normal;font-variant:normal;font-weight:normal;font-stretch:normal;font-size:16px;font-family:'TeX Gyre Termes';-inkscape-font-specification:'TeX Gyre Termes, Normal';font-variant-ligatures:normal;font-variant-caps:normal;font-variant-numeric:normal;font-variant-east-asian:normal"
x="488.81104" x="488.31104"
y="55.223"><tspan y="54.723"><tspan
x="488.81104" x="488.31104"
y="55.223" y="54.723"
font-family="'Verdana'" font-family="'Verdana'"
font-size="14" font-size="14"
id="tspan138" id="tspan138"
style="font-style:normal;font-variant:normal;font-weight:normal;font-stretch:normal;font-size:16px;font-family:'TeX Gyre Termes';-inkscape-font-specification:'TeX Gyre Termes, Normal';font-variant-ligatures:normal;font-variant-caps:normal;font-variant-numeric:normal;font-variant-east-asian:normal">Gene with four</tspan><tspan style="font-style:normal;font-variant:normal;font-weight:normal;font-stretch:normal;font-size:16px;font-family:'TeX Gyre Termes';-inkscape-font-specification:'TeX Gyre Termes, Normal';font-variant-ligatures:normal;font-variant-caps:normal;font-variant-numeric:normal;font-variant-east-asian:normal">Gene with four</tspan><tspan
x="488.81104" x="488.31104"
y="72.023003" y="71.523003"
font-family="'Verdana'" font-family="'Verdana'"
font-size="14" font-size="14"
id="tspan140" id="tspan140"
style="font-style:normal;font-variant:normal;font-weight:normal;font-stretch:normal;font-size:16px;font-family:'TeX Gyre Termes';-inkscape-font-specification:'TeX Gyre Termes, Normal';font-variant-ligatures:normal;font-variant-caps:normal;font-variant-numeric:normal;font-variant-east-asian:normal">different functions</tspan></text> style="font-style:normal;font-variant:normal;font-weight:normal;font-stretch:normal;font-size:16px;font-family:'TeX Gyre Termes';-inkscape-font-specification:'TeX Gyre Termes, Normal';font-variant-ligatures:normal;font-variant-caps:normal;font-variant-numeric:normal;font-variant-east-asian:normal">different functions</tspan></text>
<g <g
id="g152" id="g152"
transform="translate(106.977,32.725)"> transform="translate(106.477,32.225)">
<g <g
id="g150"> id="g150">
@ -1084,14 +1084,14 @@
<g <g
id="g148"> id="g148">
<polygon <polygon
points="287.833,77.152 293.523,73.847 287.833,87.775 282.142,73.847 " points="287.833,87.775 282.142,73.847 287.833,77.152 293.523,73.847 "
id="polygon146" /> id="polygon146" />
</g> </g>
</g> </g>
</g> </g>
<g <g
id="g219" id="g219"
transform="translate(106.977,32.725)"> transform="translate(106.477,32.225)">
<linearGradient <linearGradient
id="SVGID_9_" id="SVGID_9_"
gradientUnits="userSpaceOnUse" gradientUnits="userSpaceOnUse"
@ -1203,7 +1203,7 @@
<g <g
id="g186"> id="g186">
<polygon <polygon
points="235.433,157.411 232.954,153.144 243.4,157.411 232.954,161.681 " points="243.4,157.411 232.954,161.681 235.433,157.411 232.954,153.144 "
id="polygon184" /> id="polygon184" />
</g> </g>
</g> </g>
@ -1533,8 +1533,8 @@
<rect <rect
x="411.32098" x="410.82098"
y="97.583" y="97.083"
fill="none" fill="none"
width="196.65601" width="196.65601"
height="15.716" height="15.716"
@ -1544,12 +1544,12 @@
font-size="14" font-size="14"
id="text545" id="text545"
style="font-style:normal;font-variant:normal;font-weight:normal;font-stretch:normal;font-size:16px;font-family:'TeX Gyre Termes';-inkscape-font-specification:'TeX Gyre Termes, Normal';font-variant-ligatures:normal;font-variant-caps:normal;font-variant-numeric:normal;font-variant-east-asian:normal" style="font-style:normal;font-variant:normal;font-weight:normal;font-stretch:normal;font-size:16px;font-family:'TeX Gyre Termes';-inkscape-font-specification:'TeX Gyre Termes, Normal';font-variant-ligatures:normal;font-variant-caps:normal;font-variant-numeric:normal;font-variant-east-asian:normal"
x="411.3208" x="410.8208"
y="108.223">Duplication</text> y="107.723">Duplication</text>
<rect <rect
x="503.56" x="503.06"
y="215.40001" y="214.90001"
fill="none" fill="none"
width="169.136" width="169.136"
height="15.717" height="15.717"
@ -1559,14 +1559,14 @@
font-size="14" font-size="14"
id="text559" id="text559"
style="font-style:normal;font-variant:normal;font-weight:normal;font-stretch:normal;font-size:16px;font-family:'TeX Gyre Termes';-inkscape-font-specification:'TeX Gyre Termes, Normal';font-variant-ligatures:normal;font-variant-caps:normal;font-variant-numeric:normal;font-variant-east-asian:normal" style="font-style:normal;font-variant:normal;font-weight:normal;font-stretch:normal;font-size:16px;font-family:'TeX Gyre Termes';-inkscape-font-specification:'TeX Gyre Termes, Normal';font-variant-ligatures:normal;font-variant-caps:normal;font-variant-numeric:normal;font-variant-east-asian:normal"
x="503.55902" x="503.05902"
y="226.03951">Divergence</text> y="225.53951">Divergence</text>
<path <path
fill="none" fill="none"
stroke="#000000" stroke="#000000"
stroke-width="2" stroke-width="2"
stroke-miterlimit="10" stroke-miterlimit="10"
d="m 394.81,226.225 c 0,4.053 6.038,7.333 13.5,7.333 h 255.803 c 7.463,0 13.5,3.28 13.5,7.333" d="m 394.31,225.725 c 0,4.053 6.038,7.333 13.5,7.333 h 255.803 c 7.463,0 13.5,3.28 13.5,7.333"
id="path561" id="path561"
sodipodi:nodetypes="cssc" /> sodipodi:nodetypes="cssc" />
<path <path
@ -1574,12 +1574,12 @@
stroke="#000000" stroke="#000000"
stroke-width="2" stroke-width="2"
stroke-miterlimit="10" stroke-miterlimit="10"
d="m 150.31,240.891 c 0,-4.053 6.038,-7.333 13.5,-7.333 h 217.5 c 7.463,0 13.5,-3.28 13.5,-7.333" d="m 149.81,240.391 c 0,-4.053 6.038,-7.333 13.5,-7.333 h 217.5 c 7.463,0 13.5,-3.28 13.5,-7.333"
id="path563" id="path563"
sodipodi:nodetypes="cssc" /> sodipodi:nodetypes="cssc" />
<g <g
id="g573" id="g573"
transform="translate(192.977,32.725)"> transform="translate(192.477,32.225)">
<g <g
id="g571"> id="g571">
@ -1597,14 +1597,14 @@
<g <g
id="g569"> id="g569">
<polygon <polygon
points="484.637,226.775 478.945,212.847 484.637,216.151 490.327,212.847 " points="484.637,216.151 490.327,212.847 484.637,226.775 478.945,212.847 "
id="polygon567" /> id="polygon567" />
</g> </g>
</g> </g>
</g> </g>
<g <g
id="g583" id="g583"
transform="translate(58.977,32.725)"> transform="translate(58.477,32.225)">
<g <g
id="g581"> id="g581">
@ -1622,14 +1622,14 @@
<g <g
id="g579"> id="g579">
<polygon <polygon
points="91.333,226.775 85.641,212.847 91.333,216.151 97.023,212.847 " points="91.333,216.151 97.023,212.847 91.333,226.775 85.641,212.847 "
id="polygon577" /> id="polygon577" />
</g> </g>
</g> </g>
</g> </g>
<rect <rect
x="107.97701" x="107.47701"
y="371.39999" y="370.89999"
fill="none" fill="none"
width="179.33299" width="179.33299"
height="15.717" height="15.717"
@ -1639,11 +1639,11 @@
font-size="14" font-size="14"
id="text587" id="text587"
style="font-style:normal;font-variant:normal;font-weight:normal;font-stretch:normal;font-size:16px;font-family:'TeX Gyre Termes';-inkscape-font-specification:'TeX Gyre Termes, Normal';font-variant-ligatures:normal;font-variant-caps:normal;font-variant-numeric:normal;font-variant-east-asian:normal" style="font-style:normal;font-variant:normal;font-weight:normal;font-stretch:normal;font-size:16px;font-family:'TeX Gyre Termes';-inkscape-font-specification:'TeX Gyre Termes, Normal';font-variant-ligatures:normal;font-variant-caps:normal;font-variant-numeric:normal;font-variant-east-asian:normal"
x="244.30266" x="243.80266"
y="387.13199">Subfunctionalization</text> y="386.63199">Subfunctionalization</text>
<rect <rect
x="305.311" x="304.811"
y="371.39999" y="370.89999"
fill="none" fill="none"
width="179.334" width="179.334"
height="15.717" height="15.717"
@ -1653,11 +1653,11 @@
font-size="14" font-size="14"
id="text591" id="text591"
style="font-style:normal;font-variant:normal;font-weight:normal;font-stretch:normal;font-size:16px;font-family:'TeX Gyre Termes';-inkscape-font-specification:'TeX Gyre Termes, Normal';font-variant-ligatures:normal;font-variant-caps:normal;font-variant-numeric:normal;font-variant-east-asian:normal" style="font-style:normal;font-variant:normal;font-weight:normal;font-stretch:normal;font-size:16px;font-family:'TeX Gyre Termes';-inkscape-font-specification:'TeX Gyre Termes, Normal';font-variant-ligatures:normal;font-variant-caps:normal;font-variant-numeric:normal;font-variant-east-asian:normal"
x="417.67331" x="417.17331"
y="387.15601">Neofunctionalization</text> y="386.65601">Neofunctionalization</text>
<rect <rect
x="498.64301" x="498.14301"
y="371.39999" y="370.89999"
fill="none" fill="none"
width="183.334" width="183.334"
height="15.717" height="15.717"
@ -1667,11 +1667,11 @@
font-size="14" font-size="14"
id="text595" id="text595"
style="font-style:normal;font-variant:normal;font-weight:normal;font-stretch:normal;font-size:16px;font-family:'TeX Gyre Termes';-inkscape-font-specification:'TeX Gyre Termes, Normal';font-variant-ligatures:normal;font-variant-caps:normal;font-variant-numeric:normal;font-variant-east-asian:normal" style="font-style:normal;font-variant:normal;font-weight:normal;font-stretch:normal;font-size:16px;font-family:'TeX Gyre Termes';-inkscape-font-specification:'TeX Gyre Termes, Normal';font-variant-ligatures:normal;font-variant-caps:normal;font-variant-numeric:normal;font-variant-east-asian:normal"
x="592.5" x="592"
y="385.5">Degeneration/Gene loss</text> y="385">Degeneration/Gene loss</text>
<g <g
id="g3995" id="g3995"
transform="translate(112.977,32.725)"><g transform="translate(112.477,32.225)"><g
id="g2911" id="g2911"
transform="translate(82.74739)"><g transform="translate(82.74739)"><g
id="g286"> id="g286">
@ -1786,7 +1786,7 @@
<g <g
id="g253"> id="g253">
<polygon <polygon
points="235.433,246.546 232.954,242.278 243.4,246.546 232.954,250.815 " points="243.4,246.546 232.954,250.815 235.433,246.546 232.954,242.278 "
id="polygon251" /> id="polygon251" />
</g> </g>
</g> </g>
@ -2173,7 +2173,7 @@
<g <g
id="g306"> id="g306">
<polygon <polygon
points="235.433,299.715 232.954,295.447 243.4,299.715 232.954,303.984 " points="243.4,299.715 232.954,303.984 235.433,299.715 232.954,295.447 "
id="polygon304" /> id="polygon304" />
</g> </g>
</g> </g>
@ -2562,7 +2562,7 @@
<g <g
id="g359"> id="g359">
<polygon <polygon
points="46.4,246.546 35.954,250.815 38.433,246.546 35.954,242.278 " points="38.433,246.546 35.954,242.278 46.4,246.546 35.954,250.815 "
id="polygon357" /> id="polygon357" />
</g> </g>
</g> </g>
@ -2949,7 +2949,7 @@
<g <g
id="g412"> id="g412">
<polygon <polygon
points="46.4,299.715 35.954,303.984 38.433,299.715 35.954,295.447 " points="38.433,299.715 35.954,295.447 46.4,299.715 35.954,303.984 "
id="polygon410" /> id="polygon410" />
</g> </g>
</g> </g>
@ -3386,7 +3386,7 @@
<g <g
id="g479"> id="g479">
<polygon <polygon
points="429.91,250.815 432.39,246.546 429.91,242.278 440.357,246.546 " points="429.91,242.278 440.357,246.546 429.91,250.815 432.39,246.546 "
id="polygon477" /> id="polygon477" />
</g> </g>
</g> </g>
@ -4143,7 +4143,7 @@
<g <g
id="g101-5"> id="g101-5">
<polygon <polygon
points="232.954,104.84 243.4,109.107 232.954,113.377 235.433,109.107 " points="232.954,113.377 235.433,109.107 232.954,104.84 243.4,109.107 "
id="polygon99-6" /> id="polygon99-6" />
</g> </g>
</g> </g>
@ -4579,7 +4579,7 @@
<g <g
id="g186-4"> id="g186-4">
<polygon <polygon
points="232.954,153.144 243.4,157.411 232.954,161.681 235.433,157.411 " points="232.954,161.681 235.433,157.411 232.954,153.144 243.4,157.411 "
id="polygon184-4" /> id="polygon184-4" />
</g> </g>
</g> </g>
@ -4916,10 +4916,10 @@
font-size="14" font-size="14"
id="text4095" id="text4095"
style="font-style:normal;font-variant:normal;font-weight:normal;font-stretch:normal;font-size:16px;font-family:'TeX Gyre Termes';-inkscape-font-specification:'TeX Gyre Termes, Normal';font-variant-ligatures:normal;font-variant-caps:normal;font-variant-numeric:normal;font-variant-east-asian:normal" style="font-style:normal;font-variant:normal;font-weight:normal;font-stretch:normal;font-size:16px;font-family:'TeX Gyre Termes';-inkscape-font-specification:'TeX Gyre Termes, Normal';font-variant-ligatures:normal;font-variant-caps:normal;font-variant-numeric:normal;font-variant-east-asian:normal"
x="49.971992" x="49.471992"
y="385.5">Functional redoundancy</text><g y="385">Functional redoundancy</text><g
id="g4702" id="g4702"
transform="translate(-17.971606,0.5)"><g transform="translate(-18.471606)"><g
id="g555" id="g555"
transform="matrix(1,0,0,0.7957841,29.4895,79.036561)"> transform="matrix(1,0,0,0.7957841,29.4895,79.036561)">
<g <g
@ -4939,7 +4939,7 @@
<g <g
id="g551"> id="g551">
<polygon <polygon
points="282.142,212.847 287.833,216.152 293.523,212.847 287.833,226.775 " points="293.523,212.847 287.833,226.775 282.142,212.847 287.833,216.152 "
id="polygon549" /> id="polygon549" />
</g> </g>
</g> </g>
@ -4963,7 +4963,7 @@
<g <g
id="g4686"> id="g4686">
<polygon <polygon
points="287.833,216.152 293.523,212.847 287.833,226.775 282.142,212.847 " points="287.833,226.775 282.142,212.847 287.833,216.152 293.523,212.847 "
id="polygon4684" /> id="polygon4684" />
</g> </g>
</g> </g>

Before

Width:  |  Height:  |  Size: 201 KiB

After

Width:  |  Height:  |  Size: 201 KiB

View File

@ -1,117 +0,0 @@
<?xml version="1.0" encoding="UTF-8"?>
<svg xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink" width="341.353pt" height="96.089pt" viewBox="0 0 341.353 96.089" version="1.1">
<defs>
<g>
<symbol overflow="visible" id="glyph0-0">
<path style="stroke:none;" d=""/>
</symbol>
<symbol overflow="visible" id="glyph0-1">
<path style="stroke:none;" d="M 0.953125 -6.9375 L -2.640625 -3.921875 L -1.75 -2.578125 L -1.5625 -2.75 C -2.25 -3.734375 -2.1875 -3.96875 -1.375 -4.65625 C -1.265625 -4.734375 -1.109375 -4.875 -1.046875 -4.921875 C -0.921875 -5 -0.875 -4.9375 -0.765625 -4.8125 L 1.546875 -2.046875 C 1.703125 -1.875 1.765625 -1.796875 1.203125 -1.328125 L 0.984375 -1.140625 L 1.140625 -0.953125 C 1.390625 -1.203125 1.890625 -1.625 2.15625 -1.859375 C 2.4375 -2.09375 2.921875 -2.5 3.203125 -2.6875 L 3.046875 -2.875 L 2.828125 -2.6875 C 2.28125 -2.21875 2.21875 -2.296875 2.0625 -2.46875 L -0.25 -5.234375 C -0.359375 -5.359375 -0.40625 -5.421875 -0.3125 -5.546875 C -0.265625 -5.578125 -0.109375 -5.71875 0 -5.8125 C 0.296875 -6.0625 0.53125 -6.25 0.796875 -6.3125 C 1.15625 -6.359375 1.484375 -6.0625 1.515625 -6.03125 L 1.90625 -5.65625 L 2.09375 -5.8125 Z M 0.953125 -6.9375 "/>
</symbol>
<symbol overflow="visible" id="glyph0-2">
<path style="stroke:none;" d="M -0.703125 -5.703125 C -0.78125 -5.75 -0.84375 -5.78125 -0.9375 -5.703125 C -1.046875 -5.609375 -1.03125 -5.546875 -1 -5.4375 L 0.390625 -1.28125 C 0.453125 -1.125 0.5625 -0.796875 0.078125 -0.390625 L 0.234375 -0.203125 C 0.40625 -0.359375 0.59375 -0.546875 0.78125 -0.6875 C 0.984375 -0.875 1.40625 -1.171875 1.4375 -1.203125 L 1.28125 -1.390625 C 1.046875 -1.1875 0.796875 -1.171875 0.671875 -1.3125 C 0.640625 -1.359375 0.625 -1.390625 0.609375 -1.453125 L 0.3125 -2.3125 L 1.828125 -3.59375 L 2.796875 -3.09375 C 2.8125 -3.0625 2.875 -3.046875 2.890625 -3.015625 C 3.03125 -2.859375 2.734375 -2.625 2.59375 -2.5 L 2.75 -2.3125 C 3 -2.546875 3.34375 -2.859375 3.53125 -3 C 3.78125 -3.21875 4.203125 -3.53125 4.25 -3.5625 L 4.09375 -3.75 L 4 -3.671875 C 3.640625 -3.375 3.5625 -3.40625 3.375 -3.5 Z M -0.546875 -4.890625 L 1.59375 -3.71875 L 0.234375 -2.578125 Z M -0.546875 -4.890625 "/>
</symbol>
<symbol overflow="visible" id="glyph0-3">
<path style="stroke:none;" d="M 3.09375 -4.375 C 2.890625 -4.609375 2.953125 -4.671875 3.3125 -4.96875 L 3.15625 -5.15625 C 3.109375 -5.109375 2.75 -4.78125 2.484375 -4.5625 C 2.1875 -4.3125 1.796875 -3.984375 1.5 -3.765625 L 1.65625 -3.578125 L 1.859375 -3.734375 C 2.390625 -4.1875 2.453125 -4.109375 2.59375 -3.953125 L 2.890625 -3.59375 C 2.984375 -3.484375 3.15625 -3.28125 2.96875 -2.875 C 2.84375 -2.515625 2.546875 -2.265625 2.46875 -2.203125 C 1.859375 -1.6875 0.59375 -1.234375 -0.578125 -2.625 C -1.765625 -4.046875 -1.015625 -5.203125 -0.5 -5.65625 C 0.015625 -6.078125 0.96875 -6.265625 1.859375 -5.453125 C 1.921875 -5.40625 1.96875 -5.4375 2 -5.46875 C 2.09375 -5.546875 2.078125 -5.59375 1.984375 -5.703125 L 0.9375 -6.9375 C 0.859375 -7.03125 0.8125 -7.09375 0.75 -7.046875 C 0.71875 -7.015625 0.703125 -7 0.71875 -6.875 L 0.78125 -6.25 C 0.28125 -6.296875 -0.265625 -6.1875 -0.734375 -5.796875 C -1.859375 -4.859375 -2.0625 -3.203125 -1.15625 -2.140625 C -0.265625 -1.078125 1.375 -0.96875 2.53125 -1.921875 C 2.828125 -2.1875 3.359375 -2.734375 3.296875 -3.328125 C 3.5 -3.25 3.859375 -3.234375 3.90625 -3.28125 C 3.96875 -3.328125 3.921875 -3.390625 3.84375 -3.46875 Z M 3.09375 -4.375 "/>
</symbol>
<symbol overflow="visible" id="glyph1-0">
<path style="stroke:none;" d=""/>
</symbol>
<symbol overflow="visible" id="glyph1-1">
<path style="stroke:none;" d="M 0.453125 -4.28125 C 0.46875 -4.359375 0.46875 -4.359375 0.453125 -4.390625 L 0.375 -4.484375 L -0.5625 -3.703125 C -0.65625 -3.625 -1.234375 -3.1875 -1.3125 -3.140625 C -1.40625 -3.078125 -1.4375 -3.109375 -1.5 -3.140625 L -1.65625 -3.015625 L -1.078125 -2.03125 L -0.921875 -2.15625 C -0.96875 -2.234375 -1.125 -2.5 -1.09375 -2.625 C -1.078125 -2.640625 -0.71875 -2.953125 -0.65625 -3 L 0.25 -3.765625 C 0.234375 -3.4375 0.203125 -3.0625 0.203125 -2.75 C 0.234375 -1.796875 0.640625 -1.203125 0.84375 -0.953125 C 1.015625 -0.75 1.15625 -0.84375 1.234375 -0.90625 C 1.4375 -1.078125 1.28125 -1.265625 1.25 -1.3125 L 1.1875 -1.390625 C 0.609375 -2.0625 0.40625 -2.609375 0.421875 -3.046875 Z M 0.453125 -4.28125 "/>
</symbol>
<symbol overflow="visible" id="glyph1-2">
<path style="stroke:none;" d="M 0.1875 -2.3125 C 0.546875 -2.625 0.96875 -2.59375 1.28125 -2.21875 C 1.609375 -1.828125 1.546875 -1.421875 1.203125 -1.140625 C 1.15625 -1.109375 0.703125 -0.71875 0.34375 -0.765625 C 0.484375 -0.90625 0.4375 -1.0625 0.359375 -1.15625 C 0.234375 -1.296875 0.046875 -1.296875 -0.09375 -1.1875 C -0.203125 -1.078125 -0.234375 -0.921875 -0.09375 -0.75 C 0.234375 -0.359375 0.8125 -0.546875 1.34375 -1 C 1.96875 -1.515625 2.03125 -2.21875 1.71875 -2.59375 C 1.453125 -2.90625 0.96875 -2.9375 0.453125 -2.671875 C 0.78125 -3.203125 0.65625 -3.59375 0.484375 -3.8125 C 0.21875 -4.125 -0.359375 -4.015625 -0.828125 -3.609375 C -1.3125 -3.21875 -1.53125 -2.71875 -1.234375 -2.375 C -1.09375 -2.1875 -0.890625 -2.25 -0.828125 -2.3125 C -0.71875 -2.40625 -0.6875 -2.59375 -0.796875 -2.734375 C -0.875 -2.8125 -1.015625 -2.875 -1.171875 -2.796875 C -1.15625 -3.09375 -0.8125 -3.390625 -0.734375 -3.46875 C -0.453125 -3.703125 -0.140625 -3.734375 0.078125 -3.46875 C 0.265625 -3.234375 0.421875 -2.765625 0.03125 -2.421875 C -0.078125 -2.328125 -0.078125 -2.3125 -0.1875 -2.21875 C -0.21875 -2.1875 -0.28125 -2.140625 -0.21875 -2.078125 C -0.171875 -2.015625 -0.125 -2.046875 -0.0625 -2.109375 Z M 0.1875 -2.3125 "/>
</symbol>
<symbol overflow="visible" id="glyph2-0">
<path style="stroke:none;" d=""/>
</symbol>
<symbol overflow="visible" id="glyph2-1">
<path style="stroke:none;" d="M 0.953125 -6.9375 L -2.640625 -3.921875 L -1.75 -2.578125 L -1.5625 -2.75 C -2.25 -3.734375 -2.1875 -3.96875 -1.375 -4.65625 C -1.265625 -4.734375 -1.109375 -4.875 -1.046875 -4.921875 C -0.921875 -5 -0.875 -4.9375 -0.765625 -4.8125 L 1.546875 -2.046875 C 1.703125 -1.875 1.765625 -1.796875 1.203125 -1.328125 L 0.984375 -1.140625 L 1.140625 -0.953125 C 1.390625 -1.203125 1.890625 -1.625 2.15625 -1.859375 C 2.4375 -2.09375 2.921875 -2.5 3.203125 -2.6875 L 3.046875 -2.875 L 2.828125 -2.6875 C 2.28125 -2.21875 2.21875 -2.296875 2.0625 -2.46875 L -0.25 -5.234375 C -0.359375 -5.359375 -0.40625 -5.421875 -0.3125 -5.546875 C -0.265625 -5.578125 -0.109375 -5.71875 0 -5.8125 C 0.296875 -6.0625 0.53125 -6.25 0.796875 -6.3125 C 1.15625 -6.359375 1.484375 -6.0625 1.515625 -6.03125 L 1.90625 -5.65625 L 2.09375 -5.8125 Z M 0.953125 -6.9375 "/>
</symbol>
<symbol overflow="visible" id="glyph2-2">
<path style="stroke:none;" d="M -0.703125 -5.703125 C -0.78125 -5.75 -0.84375 -5.78125 -0.9375 -5.703125 C -1.046875 -5.609375 -1.03125 -5.546875 -1 -5.4375 L 0.390625 -1.28125 C 0.453125 -1.125 0.5625 -0.796875 0.078125 -0.390625 L 0.234375 -0.203125 C 0.40625 -0.359375 0.59375 -0.546875 0.78125 -0.6875 C 0.984375 -0.875 1.40625 -1.171875 1.4375 -1.203125 L 1.28125 -1.390625 C 1.046875 -1.1875 0.796875 -1.171875 0.671875 -1.3125 C 0.640625 -1.359375 0.625 -1.390625 0.609375 -1.453125 L 0.3125 -2.3125 L 1.828125 -3.59375 L 2.796875 -3.09375 C 2.8125 -3.0625 2.875 -3.046875 2.890625 -3.015625 C 3.03125 -2.859375 2.734375 -2.625 2.59375 -2.5 L 2.75 -2.3125 C 3 -2.546875 3.34375 -2.859375 3.53125 -3 C 3.78125 -3.21875 4.203125 -3.53125 4.25 -3.5625 L 4.09375 -3.75 L 4 -3.671875 C 3.640625 -3.375 3.5625 -3.40625 3.375 -3.5 Z M -0.546875 -4.890625 L 1.59375 -3.71875 L 0.234375 -2.578125 Z M -0.546875 -4.890625 "/>
</symbol>
<symbol overflow="visible" id="glyph2-3">
<path style="stroke:none;" d="M 3.09375 -4.375 C 2.890625 -4.609375 2.953125 -4.671875 3.3125 -4.96875 L 3.15625 -5.15625 C 3.109375 -5.109375 2.75 -4.78125 2.484375 -4.5625 C 2.1875 -4.3125 1.796875 -3.984375 1.5 -3.765625 L 1.65625 -3.578125 L 1.859375 -3.734375 C 2.390625 -4.1875 2.453125 -4.109375 2.59375 -3.953125 L 2.890625 -3.59375 C 2.984375 -3.484375 3.15625 -3.28125 2.96875 -2.875 C 2.84375 -2.515625 2.546875 -2.265625 2.46875 -2.203125 C 1.859375 -1.6875 0.59375 -1.234375 -0.578125 -2.625 C -1.765625 -4.046875 -1.015625 -5.203125 -0.5 -5.65625 C 0.015625 -6.078125 0.96875 -6.265625 1.859375 -5.453125 C 1.921875 -5.40625 1.96875 -5.4375 2 -5.46875 C 2.09375 -5.546875 2.078125 -5.59375 1.984375 -5.703125 L 0.9375 -6.9375 C 0.859375 -7.03125 0.8125 -7.09375 0.75 -7.046875 C 0.71875 -7.015625 0.703125 -7 0.71875 -6.875 L 0.78125 -6.25 C 0.28125 -6.296875 -0.265625 -6.1875 -0.734375 -5.796875 C -1.859375 -4.859375 -2.0625 -3.203125 -1.15625 -2.140625 C -0.265625 -1.078125 1.375 -0.96875 2.53125 -1.921875 C 2.828125 -2.1875 3.359375 -2.734375 3.296875 -3.328125 C 3.5 -3.25 3.859375 -3.234375 3.90625 -3.28125 C 3.96875 -3.328125 3.921875 -3.390625 3.84375 -3.46875 Z M 3.09375 -4.375 "/>
</symbol>
<symbol overflow="visible" id="glyph3-0">
<path style="stroke:none;" d=""/>
</symbol>
<symbol overflow="visible" id="glyph3-1">
<path style="stroke:none;" d="M 1.265625 -3.140625 C 1.046875 -3.421875 0.171875 -4.453125 -0.828125 -3.609375 C -1.828125 -2.78125 -0.953125 -1.75 -0.734375 -1.46875 C -0.5 -1.203125 0.359375 -0.171875 1.359375 -1 C 2.359375 -1.84375 1.5 -2.875 1.265625 -3.140625 Z M 1.25 -1.125 C 1.109375 -1.015625 0.765625 -0.796875 0.328125 -1.109375 C 0.109375 -1.265625 -0.109375 -1.53125 -0.375 -1.84375 C -0.625 -2.140625 -0.84375 -2.390625 -0.96875 -2.65625 C -1.140625 -3.0625 -0.890625 -3.375 -0.734375 -3.5 C -0.453125 -3.75 -0.125 -3.78125 0.1875 -3.5625 C 0.40625 -3.421875 0.671875 -3.109375 0.859375 -2.875 C 1.078125 -2.609375 1.34375 -2.296875 1.46875 -2.03125 C 1.6875 -1.5625 1.40625 -1.265625 1.25 -1.125 Z M 1.25 -1.125 "/>
</symbol>
</g>
<clipPath id="clip1">
<path d="M 0 74 L 341.351562 74 L 341.351562 76 L 0 76 Z M 0 74 "/>
</clipPath>
<clipPath id="clip2">
<path d="M 67 76 L 206 76 L 206 96.089844 L 67 96.089844 Z M 67 76 "/>
</clipPath>
<clipPath id="clip3">
<path d="M 67 76 L 206 76 L 206 96.089844 L 67 96.089844 Z M 67 76 "/>
</clipPath>
</defs>
<g id="surface1">
<g clip-path="url(#clip1)" clip-rule="nonzero">
<path style="fill:none;stroke-width:1.19553;stroke-linecap:butt;stroke-linejoin:miter;stroke:rgb(0%,0%,0%);stroke-opacity:1;stroke-miterlimit:10;" d="M -170.08225 -0.0001875 L 170.081813 -0.0001875 " transform="matrix(1,0,0,-1,170.676,74.992)"/>
</g>
<path style=" stroke:none;fill-rule:nonzero;fill:rgb(100%,50%,0%);fill-opacity:1;" d="M 14.769531 82.078125 L 43.117188 82.078125 L 43.117188 67.90625 L 14.769531 67.90625 Z M 14.769531 82.078125 "/>
<path style=" stroke:none;fill-rule:nonzero;fill:rgb(0.390625%,49.01886%,47.451782%);fill-opacity:1;" d="M 50.601562 82.078125 L 78.949219 82.078125 L 78.949219 67.90625 L 50.601562 67.90625 Z M 50.601562 82.078125 "/>
<path style=" stroke:none;fill-rule:nonzero;fill:rgb(100%,0%,0%);fill-opacity:1;" d="M 86.433594 82.078125 L 114.78125 82.078125 L 114.78125 67.90625 L 86.433594 67.90625 Z M 86.433594 82.078125 "/>
<path style=" stroke:none;fill-rule:nonzero;fill:rgb(0.390625%,49.01886%,47.451782%);fill-opacity:1;" d="M 122.265625 82.078125 L 150.609375 82.078125 L 150.609375 67.90625 L 122.265625 67.90625 Z M 122.265625 82.078125 "/>
<path style=" stroke:none;fill-rule:nonzero;fill:rgb(0.390625%,49.01886%,47.451782%);fill-opacity:1;" d="M 158.097656 82.078125 L 186.441406 82.078125 L 186.441406 67.90625 L 158.097656 67.90625 Z M 158.097656 82.078125 "/>
<path style=" stroke:none;fill-rule:nonzero;fill:rgb(0.390625%,49.01886%,47.451782%);fill-opacity:1;" d="M 193.929688 82.078125 L 222.273438 82.078125 L 222.273438 67.90625 L 193.929688 67.90625 Z M 193.929688 82.078125 "/>
<path style=" stroke:none;fill-rule:nonzero;fill:rgb(0%,31.373596%,70.588684%);fill-opacity:1;" d="M 229.761719 82.078125 L 258.105469 82.078125 L 258.105469 67.90625 L 229.761719 67.90625 Z M 229.761719 82.078125 "/>
<path style=" stroke:none;fill-rule:nonzero;fill:rgb(0%,31.373596%,70.588684%);fill-opacity:1;" d="M 265.59375 82.078125 L 293.9375 82.078125 L 293.9375 67.90625 L 265.59375 67.90625 Z M 265.59375 82.078125 "/>
<path style=" stroke:none;fill-rule:nonzero;fill:rgb(100%,50%,0%);fill-opacity:1;" d="M 301.425781 82.078125 L 329.769531 82.078125 L 329.769531 67.90625 L 301.425781 67.90625 Z M 301.425781 82.078125 "/>
<path style="fill:none;stroke-width:0.3985;stroke-linecap:butt;stroke-linejoin:miter;stroke:rgb(100%,50%,0%);stroke-opacity:1;stroke-miterlimit:10;" d="M -133.058812 7.284969 C -52.609594 74.792781 55.796656 74.792781 136.245875 7.284969 " transform="matrix(1,0,0,-1,170.676,74.992)"/>
<path style=" stroke:none;fill-rule:nonzero;fill:rgb(0%,0%,0%);fill-opacity:1;" d="M 174.382812 17.074219 C 174.382812 15.910156 173.4375 14.960938 172.269531 14.960938 C 171.101562 14.960938 170.15625 15.910156 170.15625 17.074219 C 170.15625 18.242188 171.101562 19.1875 172.269531 19.1875 C 173.4375 19.1875 174.382812 18.242188 174.382812 17.074219 Z M 174.382812 17.074219 "/>
<g style="fill:rgb(100%,50%,0%);fill-opacity:1;">
<use xlink:href="#glyph0-1" x="33.278" y="65.453"/>
</g>
<g style="fill:rgb(100%,50%,0%);fill-opacity:1;">
<use xlink:href="#glyph0-2" x="37.143016" y="62.209802"/>
</g>
<g style="fill:rgb(100%,50%,0%);fill-opacity:1;">
<use xlink:href="#glyph0-3" x="41.48241" y="58.568544"/>
</g>
<g style="fill:rgb(100%,50%,0%);fill-opacity:1;">
<use xlink:href="#glyph1-1" x="46.844673" y="55.370452"/>
</g>
<g clip-path="url(#clip2)" clip-rule="nonzero">
<path style="fill:none;stroke-width:0.3985;stroke-linecap:butt;stroke-linejoin:miter;stroke:rgb(0.390625%,49.01886%,47.451782%);stroke-opacity:1;stroke-miterlimit:10;" d="M -97.222875 -7.285344 C -81.000219 -20.898625 -59.140844 -20.898625 -42.918187 -7.285344 M -25.558812 -7.285344 C -20.039281 -11.91425 -12.605687 -11.91425 -7.086156 -7.285344 M 10.273219 -7.285344 C 15.79275 -11.91425 23.226344 -11.91425 28.745875 -7.285344 " transform="matrix(1,0,0,-1,170.676,74.992)"/>
</g>
<path style="fill:none;stroke-width:0.3985;stroke-linecap:butt;stroke-linejoin:miter;stroke:rgb(0.390625%,49.01886%,47.451782%);stroke-opacity:1;stroke-miterlimit:10;" d="M -97.226781 7.284969 C -70.297094 29.882625 -34.011937 29.882625 -7.08225 7.284969 M -97.226781 7.284969 C -59.593969 38.867 -8.883031 38.867 28.749781 7.284969 " transform="matrix(1,0,0,-1,170.676,74.992)"/>
<path style=" stroke:none;fill-rule:nonzero;fill:rgb(0%,0%,0%);fill-opacity:1;" d="M 138.550781 44.023438 C 138.550781 42.855469 137.605469 41.910156 136.4375 41.910156 C 135.269531 41.910156 134.324219 42.855469 134.324219 44.023438 C 134.324219 45.1875 135.269531 46.136719 136.4375 46.136719 C 137.605469 46.136719 138.550781 45.1875 138.550781 44.023438 Z M 138.550781 44.023438 "/>
<g style="fill:rgb(0.390625%,49.01886%,47.451782%);fill-opacity:1;">
<use xlink:href="#glyph0-1" x="69.109" y="65.453"/>
</g>
<g style="fill:rgb(0.390625%,49.01886%,47.451782%);fill-opacity:1;">
<use xlink:href="#glyph0-2" x="72.974016" y="62.209802"/>
</g>
<g style="fill:rgb(0.390625%,49.01886%,47.451782%);fill-opacity:1;">
<use xlink:href="#glyph0-3" x="77.31341" y="58.568544"/>
</g>
<g style="fill:rgb(0.390625%,49.01886%,47.451782%);fill-opacity:1;">
<use xlink:href="#glyph1-2" x="82.675673" y="55.370452"/>
</g>
<g clip-path="url(#clip3)" clip-rule="nonzero">
<path style="fill:none;stroke-width:0.3985;stroke-linecap:butt;stroke-linejoin:miter;stroke:rgb(0.390625%,49.01886%,47.451782%);stroke-opacity:1;stroke-miterlimit:10;" d="M -97.222875 -7.285344 C -81.000219 -20.898625 -59.140844 -20.898625 -42.918187 -7.285344 M -25.558812 -7.285344 C -9.336156 -20.898625 12.523219 -20.898625 28.745875 -7.285344 " transform="matrix(1,0,0,-1,170.676,74.992)"/>
</g>
<path style="fill:none;stroke-width:0.3985;stroke-linecap:butt;stroke-linejoin:miter;stroke:rgb(0%,31.373596%,70.588684%);stroke-opacity:1;stroke-miterlimit:10;" d="M 81.937281 7.284969 C 87.456813 11.917781 94.890406 11.917781 100.409938 7.284969 " transform="matrix(1,0,0,-1,170.676,74.992)"/>
<path style=" stroke:none;fill-rule:nonzero;fill:rgb(0%,0%,0%);fill-opacity:1;" d="M 263.964844 64.234375 C 263.964844 63.066406 263.015625 62.121094 261.851562 62.121094 C 260.683594 62.121094 259.738281 63.066406 259.738281 64.234375 C 259.738281 65.402344 260.683594 66.347656 261.851562 66.347656 C 263.015625 66.347656 263.964844 65.402344 263.964844 64.234375 Z M 263.964844 64.234375 "/>
<g style="fill:rgb(0%,31.373596%,70.588684%);fill-opacity:1;">
<use xlink:href="#glyph2-1" x="248.273" y="65.453"/>
</g>
<g style="fill:rgb(0%,31.373596%,70.588684%);fill-opacity:1;">
<use xlink:href="#glyph2-2" x="252.138116" y="62.209751"/>
</g>
<g style="fill:rgb(0%,31.373596%,70.588684%);fill-opacity:1;">
<use xlink:href="#glyph2-3" x="256.477625" y="58.568437"/>
</g>
<g style="fill:rgb(0%,31.373596%,70.588684%);fill-opacity:1;">
<use xlink:href="#glyph3-1" x="261.840021" y="55.370303"/>
</g>
</g>
</svg>

Before

Width:  |  Height:  |  Size: 16 KiB

View File

@ -27,7 +27,7 @@
| singleton | singleton | A gene with a single copy | | singleton | singleton | A gene with a single copy |
| polyploidisation | polyploidisation | Mechanism leading to the acquisition of at least three versions of the same original genome in a species | | polyploidisation | polyploidisation | Mechanism leading to the acquisition of at least three versions of the same original genome in a species |
| pseudogene | pseudogene | A gene-like sequence that lost its capacity to transcribe | | pseudogene | pseudogene | A gene-like sequence that lost its capacity to transcribe |
| segment_duplication | segment duplication | Long stretches of DNA sequences with high identity score | | segment_duplcation | segment duplication | Long stretches of DNA sequences with high identity score |
| retroduplication | retroduplication | Duplication of a gene through retro-transcription of its RNA transcript | | retroduplication | retroduplication | Duplication of a gene through retro-transcription of its RNA transcript |
| autopolyploidisation | autopolyploidisation | Polyploidisation within the same species | | autopolyploidisation | autopolyploidisation | Polyploidisation within the same species |
| allopolyploidisation | allopolyploidisation | Polyploidisation with genetic material coming from a diverged species | | allopolyploidisation | allopolyploidisation | Polyploidisation with genetic material coming from a diverged species |
@ -66,26 +66,29 @@
#+end_export #+end_export
* Scientific context * Scientific context
[[latex:lettrine][D]]uplicate genes represent an important fraction of Eukaryotic genes: It is estimated that between 46% and 65.5% of human genes could be considered as duplicate[fn:: The estimate vary strongly depending on the criteria in use, because ancient duplication event may be hard to detect.] [cite:@correaTransposableElementEnvironment2021]. \lettrine{D}uplicate genes represent an important fraction of Eukaryotic genes: It is estimated that between 46% and 65.5% of human genes could be considered as duplicate[fn:: The estimate vary strongly depending on the criteria in use, because ancient duplication event may be hard to detect.] [cite:@correaTransposableElementEnvironment2021].
Duplicate genes offers a pool of genetic material available for further experimentation during species evolution. Duplicate genes offers a pool of genetic material available for further experimentation during species evolution.
** Gene duplication mechanisms ** Gene duplication mechanisms
#+begin_src emacs-lisp :exports results :results raw #+begin_src emacs-lisp :exports results :results value raw
(setq fig:gene-duplication-mechanisms "#+label: fig:gene-duplication-mechanisms (setq fig:gene-duplication-mechanisms "
#+caption[Different types of duplication]: Different types of duplication. (A) Whole genome duplication. (B) An unequal crossing-over leads to a duplication of a fragment of a chromosome. (C) In tandem duplication, two (set of) genes are duplicated one after the other. (D) Retrotransposon enables retroduplication: a RNA transcript is reverse transcribed and inserted back without introns and with a polyA tail in the genome. (E) A DNA transposon can acquire a fragment of a gene. (F) Segmental duplication corresponds to long stretches of duplicated sequences with high identity. Adapted from [cite:@lallemandOverviewDuplicatedGene2020] (fig. 1) #+label: fig:gene-duplication-mechanisms
#+caption[Different types of duplication] Different types of duplication. (A) Whole genome duplication. (B) An unequal crossing-over leads to a duplication of a fragment of a chromosome. (C) In tandem duplication, two (set of) genes are duplicated one after the other. (D) Retrotransposon enables retroduplication: a RNA transcript is reverse transcribed and inserted back without introns and with a polyA tail in the genome. (E) A DNA transposon can acquire a fragment of a gene. (F) Segmental duplication corresponds to long stretches of duplicated sequences with high identity. Adapted from [cite:@lallemandOverviewDuplicatedGene2020] (fig. 1)
[[./figures/lallemand2020-fig1_copy.svg]]") [[./figures/lallemand2020-fig1_copy.svg]]")
(if (eq org-export-current-backend 'html) (if (eq org-export-current-backend 'html)
fig:gene-duplication-mechanisms fig:gene-duplication-mechanisms
"" "")
)
#+end_src #+end_src
#+RESULTS: fig:gene-duplication-mechanisms
#+begin_export latex #+begin_export latex
\fladdfig{ \fladdfig{
\includegraphics[width=.9\linewidth]{./figures/lallemand2020-fig1_copy.pdf} \includegraphics[width=.9\linewidth]{./figures/lallemand2020-fig1_copy.pdf}
\caption[Different types of duplication]{\label{fig:gene-duplication-mechanisms}Different types of duplication. (A) Whole genome duplication. (B) An unequal crossing-over leads to a duplication of a fragment of a chromosome. (C) In tandem duplication, two (set of) genes are duplicated one after the other. (D) Retrotransposon enables retroduplication: a RNA transcript is reverse transcribed and inserted back without introns and with a polyA tail in the genome. (E) A DNA transposon can acquire a fragment of a gene. (F) Segmental duplication corresponds to long stretches of duplicated sequences with high identity. (Adapted from \textcite{lallemandOverviewDuplicatedGene2020} (fig. 1)).} \caption[Different types of duplication]{\label{fig:gene-duplication-mechanisms}Different types of duplication. (A) Whole genome duplication. (B) An unequal crossing-over leads to a duplication of a fragment of a chromosome. (C) In tandem duplication, two (set of) genes are duplicated one after the other. (D) Retrotransposon enables retroduplication: a RNA transcript is reverse transcribed and inserted back without introns and with a polyA tail in the genome. (E) A DNA transposon can acquire a fragment of a gene. (F) Segmental duplication corresponds to long stretches of duplicated sequences with high identity. Adapted from \autocite{lallemandOverviewDuplicatedGene2020} (fig. 1).}
} }
#+end_export #+end_export
@ -120,23 +123,12 @@ A typical DNA transposon contains a transposase gene. This enzyme recognizes two
Finally, glspl:segment_duplication, also called /low copy repeats/ are long stretches of DNA with high identity score ([[cref:fig:gene-duplication-mechanisms]] (F)). Their exact duplication mechanism remains unclear [cite:@lallemandOverviewDuplicatedGene2020]. They may come from an accidental replication, distinct from an uneven cross-over or a double stranded breakage. Finally, glspl:segment_duplication, also called /low copy repeats/ are long stretches of DNA with high identity score ([[cref:fig:gene-duplication-mechanisms]] (F)). Their exact duplication mechanism remains unclear [cite:@lallemandOverviewDuplicatedGene2020]. They may come from an accidental replication, distinct from an uneven cross-over or a double stranded breakage.
Transposable elements may well be involved in the mechanism, as a high enrichment of transposable elements is found next to duplicate segment extremities, in /Drosophila/ [cite:@lallemandOverviewDuplicatedGene2020]. Transposable elements may well be involved in the mechanism, as a high enrichment of transposable elements is found next to duplicate segment extremities, in /Drosophila/ [cite:@lallemandOverviewDuplicatedGene2020].
#+begin_src emacs-lisp :exports results :results raw
(setq fig:duplicate-genes-fate "#+label: fig:duplicate-genes-fate
,#+caption[Fate of duplicate genes]: Fate of duplicate genes. An original gene with four functions is duplicated. Its two copies may both keep the original functions (functional redoundancy). The original functions may split between the different copies (subfunctionalization). One of the copy may acquire a new function (neofunctionalization). It may also degenerate and lose its original functions (pseudogenization). Adapted from [[https://commons.wikimedia.org/wiki/File:Evolution_fate_duplicate_genes_-_vector.svg][Smedlib]], [[https://creativecommons.org/licenses/by-sa/4.0][CC BY-SA 4.0]] via Wikimedia Commons.
[[./figures/Evolution_fate_duplicate_genes.svg]]")
(if (eq org-export-current-backend 'html)
fig:duplicate-genes-fate
""
)
#+end_src
#+RESULTS:
#+begin_export latex #+begin_export latex
\fladdfig{ \fladdfig{
\includegraphics[width=.9\linewidth]{figures/Evolution_fate_duplicate_genes.pdf} \includegraphics[width=.9\linewidth]{figures/Evolution_fate_duplicate_genes.pdf}
\caption[Fate of duplicate genes]{\label{fig:fate-duplicate-genes} Fate of duplicate genes. An original gene with four functions is duplicated. Its two copies may both keep the original functions (functional redoundancy). The original functions may split between the different copies (subfunctionalization). One of the copy may acquire a new function (neofunctionalization). It may also degenerate and lose its original functions (pseudogenization). (Adapted from \href{https://commons.wikimedia.org/wiki/File:Evolution_fate_duplicate_genes_-_vector.svg}{Smedlib}, \href{https://creativecommons.org/licenses/by-sa/4.0}{CC BY-SA 4.0}, via Wikimedia Commons).} \caption[Fate of duplicate genes]{\label{fig:fate-duplicate-genes} Fate of duplicate genes. An original gene with four functions is duplicated. Its two copies may both keep the original functions (functional redoundancy). The original functions may split between the different copies (subfunctionalization). One of the copy may acquire a new function (neofunctionalization). It may also degenerate and lose its original functions (pseudogenization).
Adapted from \href{https://commons.wikimedia.org/wiki/File:Evolution_fate_duplicate_genes_-_vector.svg}{Smedlib}, \href{https://creativecommons.org/licenses/by-sa/4.0}{CC BY-SA 4.0}, via Wikimedia Commons}
} }
#+end_export #+end_export
@ -157,49 +149,7 @@ Two duplicate genes with the same original function may encounter a gls:subfunct
# *** Functional redundancy # *** Functional redundancy
Another possibility is that the two gene copies keep the ancestral function, resulting in a functional redoundancy. In this case the quantity of gene product may increase. Another possibility is that the two gene copies keep the ancestral function, resulting in a functional redoundancy. In this case the quantity of gene product may increase.
* Objectives for the internship ** Methods to identify duplicate genes
** Scientific questions
The underlying question of FTAG Finder is the study of the evolutionary fate of duplicate genes in Eukaryotes.
Duplicate genes are
** Extend the existing FTAG Finder Galaxy pipeline
Galaxy is a web-based platform for running accessible data analysis pipelines, first designed for use in genomics data analysis [cite:@goecksGalaxyComprehensiveApproach2010].
Last year, Séanna [[latex:textsc][Charles]] worked on the Galaxy version of the FTAG Finder pipeline during her M1 internship [cite:@charlesFinalisationPipelineFTAG2023]. I will continue this work.
FTAG Finder is currently deployed on the server of the /Laboratoire de Mathématiques et Modélisation d'Évry/[fn:: [[http://stat.genopole.cnrs.fr/galaxy]] ].
** Port FTAG Finder pipeline on a workflow manager
Another objective of my internship will be to port FTAG Finder on a workflow manager better suited to larger and more reproducible analysis.
We will have to make a choice for the tool we will use.
The two main options being Snakemake and Nextflow. Snakemake is a python powered workflow manager based on rules /à la/ GNU Make [cite:@kosterSnakemakeScalableBioinformatics2012]. Nextflow is a groovy powered workflow manager, which rely on the data flows paradigm [cite:@ditommasoNextflowEnablesReproducible2017]. Both are widely used in the bioinformatics community. Their use have been on the rise since they came out in 2012 and 2013 respectively [cite:@djaffardjyDevelopingReusingBioinformatics2023].
# #+begin_export latex
# \fladdtab{
# \begin{tabular}{ccc}
# \toprule
# & List ref & List $L$ \\
# \midrule
# related to $go$ & $a$ & $b$ \\
# unrelated & $c$ & $d$ \\
# \bottomrule
# \end{tabular}
# \caption{\label{tab:fisher-test-contigency-table}Contingency table for a Fisher exact test on gene lists}
# }
# #+end_export
* Methodological approaches
** Duplicate gene detection method used in FTAG Finder
#+begin_src emacs-lisp :exports results :results raw
(setq fig:tag-definitions "#+label: fig:tag-definitions
#+caption[Schematic representation of TAG definitions]: Schematic representation of TAG definitions. Several genes are represented on a linear chromosome. The red box represent a singleton gene. Orange boxes represent a TAG with two duplicate genes seperated by 7 other genes ($\\mathrm{TAG}_7$). Four green boxes constitute a TAG, the gene at the extremities are seperated by three genes ($\\mathrm{TAG}_3$). The two blue boxes represents a TAG with two genes next to each other ($\\mathrm{TAG}_0$). The bended edges represents the homology links between each pair of genes within a TAG.
[[./figures/tag-definition.svg]]")
(if (eq org-export-current-backend 'html)
fig:tag-definitions
""
)
#+end_src
#+begin_export latex #+begin_export latex
\fladdfig{ \fladdfig{
\includegraphics[width=.9\linewidth]{./figures/tag-definition.pdf} \includegraphics[width=.9\linewidth]{./figures/tag-definition.pdf}
@ -212,50 +162,81 @@ Different methods exists to detect duplicate genes. These methods depend on the
Paralogs are homologous genes derived from a duplication event. We can identify them as homologous genes coming from the same genome, or as homologous genes between different species once we filtered out gls:orthologues (homologous genes derived from a speciation event). Paralogs are homologous genes derived from a duplication event. We can identify them as homologous genes coming from the same genome, or as homologous genes between different species once we filtered out gls:orthologues (homologous genes derived from a speciation event).
We can use two gene characteristics to assess the homology between two genes: gene structure or sequence similarity. We can use two gene characteristics to assess the homology between two genes: gene structure or sequence similarity.
The sequence similarity can be tested with a sequence alignment tool, such as =BLAST= [cite:@altschulBasicLocalAlignment1990], =Psi-BLAST=, and =HMMER3= [cite:@johnsonHiddenMarkovModel2010], or =diamond= [cite:@buchfinkSensitiveProteinAlignments2021]. These tools are heuristic algorithms, which means they may not provide the best results, but do so way faster than exact algorithms, such as the classical Smith and Waterman algorithm [cite:@smithIdentificationCommonMolecular1981] or its optimized versions =PARALIGN= [cite:@rognesParAlignParallelSequence2001] or =SWIMM=. The sequence similarity can be tested with a sequence alignment tool, such as =BLAST= [cite:@altschulBasicLocalAlignment1990], =Psi-BLAST=, and =HMMER3= [cite:@johnsonHiddenMarkovModel2010], or =diamond= [cite:@buchfinkSensitiveProteinAlignments2021], which are heuristic algorithms, which means they may not provide the best results, but do so way faster than exact algorithms, such as the classical Smith and Waterman algorithm [cite:@smithIdentificationCommonMolecular1981] or its optimized versions =PARALIGN= [cite:@rognesParAlignParallelSequence2001] or =SWIMM=.
This is the case for Triticum aestivum hybridisation, which consisted in the union of the
chromosome set of a Triticum species with those of an Aegilops species
*** FTAG Finder *** FTAG Finder
Developed in the LaMME laboratory, the FTAG Finder (Families and Tandemly Arrayed Genes Finder) pipeline is a simple pipeline targeting the detection of gls:TAG based on the sequence of the proteome of single species [cite:@bouillonFTAGFinderOutil2016]. Developed in the LaMME laboratory, the FTAG Finder (Families and Tandemly Arrayed Genes Finder) pipeline is a simple pipeline targeting the detection of gls:TAG from the proteome of single species [cite:@bouillonFTAGFinderOutil2016].
The pipeline proceeds in three steps. First, it estimates the homology links between each pair of genes. Then, it deduces the gene families. Finally, it searches for gls:TAG, relying on the position of genes belonging to the same family. The pipeline proceeds in three steps. First, it estimates the homology links between each pair of genes. Then, it deduces the gene families. Finally, it searches for gls:TAG.
**** Estimation of homology links between genes **** Estimation of homology links between genes
This step consists in establishing a homology relationship between each genes in the proteome. This step consists in establishing a homology relationship between each genes in the proteome.
In this step, FTAG Finder uses =BLAST= (Basic Local Alignment Search Tool) [cite:@altschulBasicLocalAlignment1990] with an "all against all" search on the proteome. In this step, the typical tool involved is =BLAST= (Basic Local Alignment Search Tool) [cite:@altschulBasicLocalAlignment1990] run "all against all" on the proteome.
Several =BLAST= metrics can be used as an homology measure, such as bitscore, identity percentage, E-value or a variation on these. The choice of metrics can affect the results of graph clustering in the following step, and we should therefore chose them carefully [cite:@gibbonsEvaluationBLASTbasedEdgeweighting2015]. Several =BLAST= metrics can be used as an homology measure, such as bitscore, identity percentage, E-value or variations of these. The choice of metrics can affect the results of graph clustering in the following step, and we should therefore chose them carefully [cite:@gibbonsEvaluationBLASTbasedEdgeweighting2015].
**** Identification of gene families **** Identification of gene families
Based on the homology links between each pair of genes, we construct an undirected weighted graph whose vertices correspond to genes and whose edges corresponds to homology links between them. Based on the homology links between each pair of genes, we construct an undirected weighted graph whose vertices correspond to genes and edges to homology links between them.
We apply a graph clustering algorithm on the homology gene graph in order to infer the gene families corresponding to densely connected communities of vertices. We apply a graph clustering algorithm on the graph in order to infer the gene families corresponding to densely connected communities of vertices.
FTAG Finder proposes three graph clustering algorithm alternatives: single linkage, Markov Clustering [cite:@vandongenNewClusterAlgorithm1998] or Walktrap [cite:@ponsComputingCommunitiesLarge2005]. FTAG Finder proposes three clustering algorithm alternatives: single linkage, Markov Clustering [cite:@vandongenNewClusterAlgorithm1998] or Walktrap [cite:@ponsComputingCommunitiesLarge2005].
**** Detection of TAG
**** Detection of TAGs
The final step of FTAG Finder consists in the identification of gls:TAG from the gene families and the positions of genes. The final step of FTAG Finder consists in the identification of gls:TAG from the gene families and the positions of genes.
For a given chromosome, the tool seeks genes belonging to the same family and located close to each other. The tool allows a maximal number of genes between the homologous genes, with a parameter set by the user. Cref:fig:tag-definitions is a schematic representation of some possible gls:TAG positioning on a genome associated with their definition in this FTAG Finder step. For a given chromosome, the tool seeks genes belonging to the same family and located close to each other. The tool allows a maximal number of genes between the homologous genes, with a parameter set by the user. Cref:fig:tag-definitions is a schematic representation of some possible gls:TAG positioning on a genome associated with their definition in FTAG Finder /Find Tags/ step.
** Analyses performed on TAG * Objectives for the internship
** Scientific questions
The underlying question of FTAG Finder is the study of the evolutionary fate of duplicate genes in Eukaryotes.
Duplicate genes are
** Extend the existing FTAG Finder Galaxy pipeline
Galaxy is a web-based platform for running accessible data analysis pipelines, first designed for use in genomics data analysis [cite:@goecksGalaxyComprehensiveApproach2010].
Last year, Séanna [[latex:textsc][Charles]] worked on the Galaxy version of the FTAG Finder pipeline during her M1 internship [cite:@charlesFinalisationPipelineFTAG2023]. I will continue this work.
FTAG Finder is currently deployed on the server of the /Laboratoire d'Analyse et Modélisation d'Évry/[fn: [[http://stat.genopole.cnrs.fr/galaxy]] ].
FTAG Finder output consist mostly in list of genes, corresponding to TAG of various definition. These list can be subsequently used as the basis of more specific statistical analysis. ** Port FTAG Finder pipeline on a workflow manager
Another objective of my internship will be to port FTAG Finder on a workflow manager better suited to larger and more reproducible analysis.
*** Are there over-represented gene functions among TAG We will have to make a choice for the tool we will use.
The two main options being Snakemake and Nextflow. Snakemake is a python powered workflow manager based on rules /à la/ GNU Make [cite:@kosterSnakemakeScalableBioinformatics2012]. Nextflow is a groovy powered workflow manager, which rely on the data flows paradigm [cite:@ditommasoNextflowEnablesReproducible2017]. Both are widely used in the bioinformatics community. Their use have been on the rise since they came out in 2012 and 2013 respectively [cite:@djaffardjyDevelopingReusingBioinformatics2023].
The gls:GO describes biological concepts across three main classes: Cellular Component, Molecular Function and Biological Process. It describes a controlled vocabulary of concepts and the relationships between them. We can link genes with function annotation with particular GO terms. We can then perform an GO enrichment analysis to assess whether a particular GO term is over-represented in a particular gene list, compared to another. To do so, we can use a Fisher exact test, using the FDR (False Discovery Rate) control procedure of [[latex:textsc][Benjamini]] and [[latex:textsc][Hocheberg]]. #+begin_export latex
\fladdtab{
\begin{tabular}{ccc}
\toprule
& List ref & List $L$ \\
\midrule
related to $go$ & $a$ & $b$ \\
unrelated & $c$ & $d$ \\
\bottomrule
\end{tabular}
\caption{\label{tab:fisher-test-contigency-table}Contingency table for a Fisher exact test on gene lists}
}
#+end_export
* Methodological approaches
# Let $go$ be a GO term. We construct a contingency matrix based on the count of genes associated with this GO term (or associated with one of its brother GO term) for the reference gene list and the list of interest (here, the list of genes in a TAG) (see cref:tab:fisher-test-contigency-table). Based on the output of the FTAG Finder pipeline, which consist in lists of genes, researchers could perform bespoke subsequent analyses on TAGs.
*** Are TAG located preferentially on specific chromosome region?
*** Are there chromosomes enriched or depleted in TAG? ** Analysis of over-represented gene functions among TAGs
The gls:GO describes biological concepts across three main classes: Cellular Component, Molecular Function and Biological Process. It describe a controlled vocabulary of concepts and the relationship between them. The genes with known functions can be associated with a particular GO term. We can perform an GO enrichment analysis to assess whether a particular GO term is over-represented in a particular gene list, compared to an other. We can use a Fisher exact test, using the FDR (False Discovery Rate) control procedure of [[latex:textsc][Benjamini]] and [[latex:textsc][Hocheberg]] to do so.
*** Do genes located next to each other in a TAG share the same orientation? Let $go$ be a GO term. We construct a contingency matrix based on the count of genes associated with this GO term (or associated with one of its brother GO term) for the reference gene list and the list of interest (here, the list of genes in a TAG) (see cref:tab:fisher-test-contigency-table).
** Are TAG located preferentially on specific chromosome region?
** Are there chromosomes enriched or depleted in TAG?
** Do genes located next to each other in a TAG share the same orientation?
The concordance of two genes of a TAG falls in three possible cases: either both genes are on the same strand (\(\rightarrow \rightarrow\)), either they have a divergent orientation (\(\leftarrow \rightarrow\)), or a convergent one (\(\rightarrow \leftarrow\)). Graham conjectured that genes of a TAG that are close to each other would be more likely to share the same orientation, and it seems to be effectively the case [cite:@shojaRoadmapTandemlyArrayed2006]. The concordance of two genes of a TAG falls in three possible cases: either both genes are on the same strand (\(\rightarrow \rightarrow\)), either they have a divergent orientation (\(\leftarrow \rightarrow\)), or a convergent one (\(\rightarrow \leftarrow\)). Graham conjectured that genes of a TAG that are close to each other would be more likely to share the same orientation, and it seems to be effectively the case [cite:@shojaRoadmapTandemlyArrayed2006].
# To test this, we can use a $\Chi^2$ test of goodness of fit or a Student $t$-test. # To test this, we can use a $\Chi^2$ test of goodness of fit or a Student $t$-test.
*** What is the robustness and accuracy of the detection method? *** TODO write down the hypotheses
[cite/t:@le-hoangEtudeTranscriptomiqueGenes2017] started analyzing the impact of parameter choice on FTAG Finder results. A more detailed benchmark of FTAG Finder in comparison with other methods on some controlled test dataset might be of particular interest. ** What is the robustness and accuracy of the detection method?
This would pose the challenge of homogenization of the outputs of the different methods.
[cite/t:@le-hoangEtudeTranscriptomiqueGenes2017] started analyses of the impact of parameter choice on FTAG Finder output lists. A more detailed benchmark of FTAG Finder in comparison with other methods on some known test dataset might be of particular interest.
#+begin_export latex #+begin_export latex
\flstop \flstop
@ -266,7 +247,9 @@ This would pose the challenge of homogenization of the outputs of the different
:UNNUMBERED: t :UNNUMBERED: t
:END: :END:
#+print_bibliography: #+begin_export latex
\printbibliography[heading=none]
#+end_export
#+begin_export latex #+begin_export latex
\cleartoleftpage \cleartoleftpage
@ -316,8 +299,10 @@ Principle: construct vertex communities based on where an agent would get stuck
: Loaded ./setup.el : Loaded ./setup.el
#+begin_example
# LocalWords: speciation subfunctionalization neofunctionalization # LocalWords: speciation subfunctionalization neofunctionalization
# LocalWords: pseudogenization bioinformatics # LocalWords: pseudogenization bioinformatics
# # Local Variables: # Local Variables:
# # eval: (progn (org-babel-goto-named-src-block "startup") (org-babel-execute-src-block) (outline-hide-sublevels 1)) # eval: (progn (org-babel-goto-named-src-block "startup") (org-babel-execute-src-block) (outline-hide-sublevels 1))
# # End: # End:
#+end_example

BIN
report.pdf (Stored with Git LFS)

Binary file not shown.