Amend text and switch figure extension based on HTML or LaTeX export
This commit is contained in:
parent
a9c2944d66
commit
354c1fd1ca
BIN
figures/lallemand2020-fig1_copy.pdf (Stored with Git LFS)
BIN
figures/lallemand2020-fig1_copy.pdf (Stored with Git LFS)
Binary file not shown.
|
@ -2,9 +2,9 @@
|
||||||
<!-- Created with Inkscape (http://www.inkscape.org/) -->
|
<!-- Created with Inkscape (http://www.inkscape.org/) -->
|
||||||
|
|
||||||
<svg
|
<svg
|
||||||
width="210mm"
|
width="200mm"
|
||||||
height="297mm"
|
height="230mm"
|
||||||
viewBox="0 0 210 297"
|
viewBox="0 0 200 230"
|
||||||
version="1.1"
|
version="1.1"
|
||||||
id="svg1"
|
id="svg1"
|
||||||
inkscape:version="1.3.2 (091e20ef0f, 2023-11-25)"
|
inkscape:version="1.3.2 (091e20ef0f, 2023-11-25)"
|
||||||
|
@ -28,8 +28,8 @@
|
||||||
inkscape:document-units="mm"
|
inkscape:document-units="mm"
|
||||||
showgrid="true"
|
showgrid="true"
|
||||||
inkscape:zoom="0.74398314"
|
inkscape:zoom="0.74398314"
|
||||||
inkscape:cx="401.89083"
|
inkscape:cx="51.076426"
|
||||||
inkscape:cy="616.94947"
|
inkscape:cy="404.57906"
|
||||||
inkscape:window-width="1920"
|
inkscape:window-width="1920"
|
||||||
inkscape:window-height="1008"
|
inkscape:window-height="1008"
|
||||||
inkscape:window-x="0"
|
inkscape:window-x="0"
|
||||||
|
@ -39,8 +39,8 @@
|
||||||
<inkscape:grid
|
<inkscape:grid
|
||||||
id="grid2"
|
id="grid2"
|
||||||
units="mm"
|
units="mm"
|
||||||
originx="0"
|
originx="-5.0000023"
|
||||||
originy="0"
|
originy="-5.0000001"
|
||||||
spacingx="0.99999998"
|
spacingx="0.99999998"
|
||||||
spacingy="1"
|
spacingy="1"
|
||||||
empcolor="#0099e5"
|
empcolor="#0099e5"
|
||||||
|
@ -173,7 +173,8 @@
|
||||||
<g
|
<g
|
||||||
inkscape:label="Layer 1"
|
inkscape:label="Layer 1"
|
||||||
inkscape:groupmode="layer"
|
inkscape:groupmode="layer"
|
||||||
id="layer1">
|
id="layer1"
|
||||||
|
transform="translate(-5.0000024,-5)">
|
||||||
<g
|
<g
|
||||||
id="g64">
|
id="g64">
|
||||||
<g
|
<g
|
||||||
|
@ -379,7 +380,7 @@
|
||||||
</g>
|
</g>
|
||||||
<path
|
<path
|
||||||
style="fill:none;fill-opacity:0.913725;stroke:#000000;stroke-width:1;stroke-dasharray:none;stroke-opacity:1;marker-end:url(#ArrowTriangleStylized)"
|
style="fill:none;fill-opacity:0.913725;stroke:#000000;stroke-width:1;stroke-dasharray:none;stroke-opacity:1;marker-end:url(#ArrowTriangleStylized)"
|
||||||
d="m 90.456771,34.997399 25.032419,0.0026"
|
d="m 89.999994,34.997399 25.032416,0.0026"
|
||||||
id="path23" />
|
id="path23" />
|
||||||
<text
|
<text
|
||||||
xml:space="preserve"
|
xml:space="preserve"
|
||||||
|
@ -403,19 +404,19 @@
|
||||||
sodipodi:nodetypes="cc" />
|
sodipodi:nodetypes="cc" />
|
||||||
<path
|
<path
|
||||||
style="fill:none;fill-opacity:0.913725;stroke:#000000;stroke-width:1;stroke-dasharray:none;stroke-opacity:1;marker-end:url(#ArrowTriangleStylized)"
|
style="fill:none;fill-opacity:0.913725;stroke:#000000;stroke-width:1;stroke-dasharray:none;stroke-opacity:1;marker-end:url(#ArrowTriangleStylized)"
|
||||||
d="m 90.456777,68.997621 25.032413,0.003"
|
d="m 90.000002,68.997621 25.032418,0.003"
|
||||||
id="path24" />
|
id="path24" />
|
||||||
<text
|
<text
|
||||||
xml:space="preserve"
|
xml:space="preserve"
|
||||||
style="font-style:normal;font-variant:normal;font-weight:normal;font-stretch:normal;font-size:4.23333px;font-family:'TeX Gyre Termes';-inkscape-font-specification:'TeX Gyre Termes, Normal';font-variant-ligatures:normal;font-variant-caps:normal;font-variant-numeric:normal;font-variant-east-asian:normal;fill:#000000;fill-opacity:0.913725;stroke-width:1"
|
style="font-style:normal;font-variant:normal;font-weight:normal;font-stretch:normal;font-size:4.23333px;font-family:'TeX Gyre Termes';-inkscape-font-specification:'TeX Gyre Termes, Normal';font-variant-ligatures:normal;font-variant-caps:normal;font-variant-numeric:normal;font-variant-east-asian:normal;fill:#000000;fill-opacity:0.913725;stroke-width:1"
|
||||||
x="86.394516"
|
x="87.620811"
|
||||||
y="61.889977"
|
y="61.320938"
|
||||||
id="text3"><tspan
|
id="text3"><tspan
|
||||||
sodipodi:role="line"
|
sodipodi:role="line"
|
||||||
id="tspan3"
|
id="tspan3"
|
||||||
style="font-style:normal;font-variant:normal;font-weight:normal;font-stretch:normal;font-size:4.23333px;font-family:'TeX Gyre Termes';-inkscape-font-specification:'TeX Gyre Termes, Normal';font-variant-ligatures:normal;font-variant-caps:normal;font-variant-numeric:normal;font-variant-east-asian:normal;stroke-width:1"
|
style="font-style:normal;font-variant:normal;font-weight:normal;font-stretch:normal;font-size:4.23333px;font-family:'TeX Gyre Termes';-inkscape-font-specification:'TeX Gyre Termes, Normal';font-variant-ligatures:normal;font-variant-caps:normal;font-variant-numeric:normal;font-variant-east-asian:normal;stroke-width:1"
|
||||||
x="86.394516"
|
x="87.620811"
|
||||||
y="61.889977">unequal crossing-over</tspan></text>
|
y="61.320938">unequal crossing-over</tspan></text>
|
||||||
<path
|
<path
|
||||||
style="fill:none;fill-opacity:0.913725;stroke:#ffaaaa;stroke-width:1"
|
style="fill:none;fill-opacity:0.913725;stroke:#ffaaaa;stroke-width:1"
|
||||||
d="m 43.015474,82.180432 0.03973,8.74277"
|
d="m 43.015474,82.180432 0.03973,8.74277"
|
||||||
|
@ -505,41 +506,41 @@
|
||||||
</g>
|
</g>
|
||||||
<text
|
<text
|
||||||
xml:space="preserve"
|
xml:space="preserve"
|
||||||
style="font-size:4.2333298px;font-family:'TeX Gyre Termes';-inkscape-font-specification:'TeX Gyre Termes, Normal';fill:none;fill-opacity:0.913725;stroke:#000000;stroke-width:1;stroke-dasharray:none;stroke-opacity:1;font-weight:normal;font-style:normal;font-stretch:normal;font-variant:normal;font-variant-ligatures:normal;font-variant-caps:normal;font-variant-numeric:normal;font-variant-east-asian:normal"
|
style="font-style:normal;font-variant:normal;font-weight:normal;font-stretch:normal;font-size:4.23333px;font-family:'TeX Gyre Termes';-inkscape-font-specification:'TeX Gyre Termes, Normal';font-variant-ligatures:normal;font-variant-caps:normal;font-variant-numeric:normal;font-variant-east-asian:normal;fill:none;fill-opacity:0.913725;stroke:#000000;stroke-width:1;stroke-dasharray:none;stroke-opacity:1"
|
||||||
x="75.085213"
|
x="75.085213"
|
||||||
y="151.30989"
|
y="151.30989"
|
||||||
id="text4"><tspan
|
id="text4"><tspan
|
||||||
sodipodi:role="line"
|
sodipodi:role="line"
|
||||||
id="tspan4"
|
id="tspan4"
|
||||||
style="fill:#000000;stroke:none;stroke-width:1;-inkscape-font-specification:'TeX Gyre Termes, Normal';font-family:'TeX Gyre Termes';font-weight:normal;font-style:normal;font-stretch:normal;font-variant:normal;font-size:4.2333298px;font-variant-ligatures:normal;font-variant-caps:normal;font-variant-numeric:normal;font-variant-east-asian:normal"
|
style="font-style:normal;font-variant:normal;font-weight:normal;font-stretch:normal;font-size:4.23333px;font-family:'TeX Gyre Termes';-inkscape-font-specification:'TeX Gyre Termes, Normal';font-variant-ligatures:normal;font-variant-caps:normal;font-variant-numeric:normal;font-variant-east-asian:normal;fill:#000000;stroke:none;stroke-width:1"
|
||||||
x="75.085213"
|
x="75.085213"
|
||||||
y="151.30989" /></text>
|
y="151.30989" /></text>
|
||||||
<text
|
<text
|
||||||
xml:space="preserve"
|
xml:space="preserve"
|
||||||
style="font-style:normal;font-variant:normal;font-weight:normal;font-stretch:normal;font-size:4.23333px;font-family:'TeX Gyre Termes';-inkscape-font-specification:'TeX Gyre Termes, Normal';font-variant-ligatures:normal;font-variant-caps:normal;font-variant-numeric:normal;font-variant-east-asian:normal;fill:#000000;fill-opacity:0.913725;stroke:none;stroke-width:1;stroke-dasharray:1, 1"
|
style="font-style:normal;font-variant:normal;font-weight:normal;font-stretch:normal;font-size:4.23333px;font-family:'TeX Gyre Termes';-inkscape-font-specification:'TeX Gyre Termes, Normal';font-variant-ligatures:normal;font-variant-caps:normal;font-variant-numeric:normal;font-variant-east-asian:normal;fill:#000000;fill-opacity:0.913725;stroke:none;stroke-width:1;stroke-dasharray:1, 1"
|
||||||
x="92.428703"
|
x="90.094139"
|
||||||
y="163.95569"
|
y="163.34464"
|
||||||
id="text6"><tspan
|
id="text6"><tspan
|
||||||
sodipodi:role="line"
|
sodipodi:role="line"
|
||||||
id="tspan6"
|
id="tspan6"
|
||||||
style="font-style:normal;font-variant:normal;font-weight:normal;font-stretch:normal;font-size:4.23333px;font-family:'TeX Gyre Termes';-inkscape-font-specification:'TeX Gyre Termes, Normal';font-variant-ligatures:normal;font-variant-caps:normal;font-variant-numeric:normal;font-variant-east-asian:normal;stroke-width:1"
|
style="font-style:normal;font-variant:normal;font-weight:normal;font-stretch:normal;font-size:4.23333px;font-family:'TeX Gyre Termes';-inkscape-font-specification:'TeX Gyre Termes, Normal';font-variant-ligatures:normal;font-variant-caps:normal;font-variant-numeric:normal;font-variant-east-asian:normal;stroke-width:1"
|
||||||
x="92.428703"
|
x="90.094139"
|
||||||
y="163.95569">transduplication</tspan></text>
|
y="163.34464">transduplication</tspan></text>
|
||||||
<path
|
<path
|
||||||
style="fill:none;fill-opacity:0.913725;stroke:#000000;stroke-width:1;stroke-dasharray:none;stroke-opacity:1;marker-end:url(#ArrowTriangleStylized)"
|
style="fill:none;fill-opacity:0.913725;stroke:#000000;stroke-width:1;stroke-dasharray:none;stroke-opacity:1;marker-end:url(#ArrowTriangleStylized)"
|
||||||
d="m 89.186472,102.99821 25.032418,0.003"
|
d="m 90.000002,102.99821 25.032418,0.003"
|
||||||
id="path1" />
|
id="path1" />
|
||||||
<text
|
<text
|
||||||
xml:space="preserve"
|
xml:space="preserve"
|
||||||
style="font-style:normal;font-variant:normal;font-weight:normal;font-stretch:normal;font-size:4.23333px;font-family:'TeX Gyre Termes';-inkscape-font-specification:'TeX Gyre Termes, Normal';font-variant-ligatures:normal;font-variant-caps:normal;font-variant-numeric:normal;font-variant-east-asian:normal;fill:#000000;fill-opacity:0.913725;stroke:#ffaaaa;stroke-width:1;stroke-dasharray:1, 1"
|
style="font-style:normal;font-variant:normal;font-weight:normal;font-stretch:normal;font-size:4.23333px;font-family:'TeX Gyre Termes';-inkscape-font-specification:'TeX Gyre Termes, Normal';font-variant-ligatures:normal;font-variant-caps:normal;font-variant-numeric:normal;font-variant-east-asian:normal;fill:#000000;fill-opacity:0.913725;stroke:#ffaaaa;stroke-width:1;stroke-dasharray:1, 1"
|
||||||
x="88.718613"
|
x="89.944908"
|
||||||
y="95.573738"
|
y="96.640633"
|
||||||
id="text5"><tspan
|
id="text5"><tspan
|
||||||
sodipodi:role="line"
|
sodipodi:role="line"
|
||||||
id="tspan5"
|
id="tspan5"
|
||||||
style="font-style:normal;font-variant:normal;font-weight:normal;font-stretch:normal;font-size:4.23333px;font-family:'TeX Gyre Termes';-inkscape-font-specification:'TeX Gyre Termes, Normal';font-variant-ligatures:normal;font-variant-caps:normal;font-variant-numeric:normal;font-variant-east-asian:normal;fill:#000000;stroke:none;stroke-width:1"
|
style="font-style:normal;font-variant:normal;font-weight:normal;font-stretch:normal;font-size:4.23333px;font-family:'TeX Gyre Termes';-inkscape-font-specification:'TeX Gyre Termes, Normal';font-variant-ligatures:normal;font-variant-caps:normal;font-variant-numeric:normal;font-variant-east-asian:normal;fill:#000000;stroke:none;stroke-width:1"
|
||||||
x="88.718613"
|
x="89.944908"
|
||||||
y="95.573738">tandem duplication</tspan></text>
|
y="96.640633">tandem duplication</tspan></text>
|
||||||
<g
|
<g
|
||||||
id="g54"
|
id="g54"
|
||||||
transform="matrix(0.75018563,0,0,0.75018563,30.108223,22.451333)">
|
transform="matrix(0.75018563,0,0,0.75018563,30.108223,22.451333)">
|
||||||
|
@ -730,7 +731,7 @@
|
||||||
y="129.25327">retroduplication</tspan></text>
|
y="129.25327">retroduplication</tspan></text>
|
||||||
<path
|
<path
|
||||||
style="fill:none;fill-opacity:0.913725;stroke:#000000;stroke-width:1;stroke-dasharray:none;stroke-opacity:1;marker-end:url(#ArrowTriangleStylized-0)"
|
style="fill:none;fill-opacity:0.913725;stroke:#000000;stroke-width:1;stroke-dasharray:none;stroke-opacity:1;marker-end:url(#ArrowTriangleStylized-0)"
|
||||||
d="m 90.456779,136.99881 25.032411,0.003"
|
d="m 89.622314,134.99671 25.032406,0.003"
|
||||||
id="path1-7" />
|
id="path1-7" />
|
||||||
<path
|
<path
|
||||||
style="fill:#000000;fill-opacity:1;stroke:#000000;stroke-width:0.25;stroke-dasharray:none;stroke-opacity:1"
|
style="fill:#000000;fill-opacity:1;stroke:#000000;stroke-width:0.25;stroke-dasharray:none;stroke-opacity:1"
|
||||||
|
@ -914,7 +915,7 @@
|
||||||
y="157.28877">retrocopy</tspan></text>
|
y="157.28877">retrocopy</tspan></text>
|
||||||
<path
|
<path
|
||||||
style="fill:none;fill-opacity:0.913725;stroke:#000000;stroke-width:1;stroke-dasharray:none;stroke-opacity:1;marker-end:url(#ArrowTriangleStylized-0)"
|
style="fill:none;fill-opacity:0.913725;stroke:#000000;stroke-width:1;stroke-dasharray:none;stroke-opacity:1;marker-end:url(#ArrowTriangleStylized-0)"
|
||||||
d="m 92.483797,170.9994 25.032413,0.003"
|
d="m 90.000002,170.9994 25.032418,0.003"
|
||||||
id="path69" />
|
id="path69" />
|
||||||
<path
|
<path
|
||||||
style="fill:none;fill-opacity:1;stroke:#000000;stroke-width:0.25;stroke-dasharray:none;stroke-opacity:1"
|
style="fill:none;fill-opacity:1;stroke:#000000;stroke-width:0.25;stroke-dasharray:none;stroke-opacity:1"
|
||||||
|
@ -1028,7 +1029,8 @@
|
||||||
<g
|
<g
|
||||||
inkscape:groupmode="layer"
|
inkscape:groupmode="layer"
|
||||||
id="layer2"
|
id="layer2"
|
||||||
inkscape:label="Caption">
|
inkscape:label="Caption"
|
||||||
|
transform="translate(-5.0000024,-5)">
|
||||||
<text
|
<text
|
||||||
xml:space="preserve"
|
xml:space="preserve"
|
||||||
style="font-style:normal;font-variant:normal;font-weight:normal;font-stretch:normal;font-size:4.23333px;font-family:'TeX Gyre Termes';-inkscape-font-specification:'TeX Gyre Termes, Normal';font-variant-ligatures:normal;font-variant-caps:normal;font-variant-numeric:normal;font-variant-east-asian:normal;fill:none;fill-opacity:0.913725;stroke:#cccccc;stroke-width:1"
|
style="font-style:normal;font-variant:normal;font-weight:normal;font-stretch:normal;font-size:4.23333px;font-family:'TeX Gyre Termes';-inkscape-font-specification:'TeX Gyre Termes, Normal';font-variant-ligatures:normal;font-variant-caps:normal;font-variant-numeric:normal;font-variant-east-asian:normal;fill:none;fill-opacity:0.913725;stroke:#cccccc;stroke-width:1"
|
||||||
|
|
Before Width: | Height: | Size: 50 KiB After Width: | Height: | Size: 50 KiB |
74
report.org
74
report.org
|
@ -1,4 +1,4 @@
|
||||||
#+title: Further development on FTAG Finder, a pipeline to identify Tandemly Arrayed Genes
|
#+title: Further development on FTAG Finder, a pipeline to identify Gene Families and Tandemly Arrayed Genes
|
||||||
#+author: Samuel Ortion
|
#+author: Samuel Ortion
|
||||||
#+date: 2023-2024
|
#+date: 2023-2024
|
||||||
#+LATEX_CLASS: scientific-project
|
#+LATEX_CLASS: scientific-project
|
||||||
|
@ -16,13 +16,14 @@
|
||||||
| TAG | TAG | Tandemly Arrayed Gene |
|
| TAG | TAG | Tandemly Arrayed Gene |
|
||||||
| FTAG | FTAG | Families and Tandemly Arrayed Gene |
|
| FTAG | FTAG | Families and Tandemly Arrayed Gene |
|
||||||
| WGD | WGD | Whole Genome Duplication |
|
| WGD | WGD | Whole Genome Duplication |
|
||||||
|
| MCL | MCL | Markov Clustering |
|
||||||
|
|
||||||
#+begin_export latex
|
#+begin_export latex
|
||||||
|
\makeatletter
|
||||||
\hypersetup{
|
\hypersetup{
|
||||||
pdfauthor={Samuel Ortion},
|
|
||||||
pdftitle={},
|
|
||||||
pdfkeywords={duplicate genes, workflow management systems, pipeline},
|
pdfkeywords={duplicate genes, workflow management systems, pipeline},
|
||||||
}
|
}
|
||||||
|
\makeatother
|
||||||
\pagenumbering{roman}
|
\pagenumbering{roman}
|
||||||
#+end_export
|
#+end_export
|
||||||
#+begin_myabstract
|
#+begin_myabstract
|
||||||
|
@ -38,7 +39,7 @@ TODO:
|
||||||
#+begin_export latex
|
#+begin_export latex
|
||||||
\tableofcontents
|
\tableofcontents
|
||||||
\listoffigures
|
\listoffigures
|
||||||
\listoftables
|
%\listoftables
|
||||||
#+end_export
|
#+end_export
|
||||||
|
|
||||||
[[printglossaries:]]
|
[[printglossaries:]]
|
||||||
|
@ -48,9 +49,24 @@ TODO:
|
||||||
#+end_export
|
#+end_export
|
||||||
|
|
||||||
* Context
|
* Context
|
||||||
|
It is estimated that between 46% and 65.5% of human genes could be considered as duplicate genes [cite:@correaTransposableElementEnvironment2021].
|
||||||
|
Duplicate genes offer a pool of genetic material available for further experimentation during species evolution.
|
||||||
|
|
||||||
** Duplication mechanisms
|
** Duplication mechanisms
|
||||||
#+name: fig:gene-duplication-mechanisms
|
#+name: fig:gene-duplication-mechanisms
|
||||||
[[./figures/lallemand2020-fig1_copy.pdf]]
|
#+begin_src emacs-lisp :exports results :results raw
|
||||||
|
(cond
|
||||||
|
((org-export-derived-backend-p org-export-current-backend 'html)
|
||||||
|
"[[./figures/lallemand2020-fig1_copy.svg]]")
|
||||||
|
((org-export-derived-backend-p org-export-current-backend 'latex)
|
||||||
|
"[[./figures/lallemand2020-fig1_copy.pdf]]")
|
||||||
|
(t "[[./figures/lallemand2020-fig1_copy.svg]]"))
|
||||||
|
#+end_src
|
||||||
|
#+caption[Different types of duplications]: Different types of duplications. (A) Whole genome duplication. (B) An unequal crossing-over leads to a duplication of a fragment of a chromosome. (C) In tandem duplication, two (sets of) genes are duplicated one after the other. (D) A retrotransposon enables retroduplication: an RNA transcript is reverse transcribed and inserted back without introns and with a polyA tail in the genome. (E) A DNA transposon can acquire a fragment of a gene. (F) Segmental duplication corresponds to long stretches of duplicated sequences with high identity. *Source* Adapted from [cite:@lallemandOverviewDuplicatedGene2020].
|
||||||
|
#+RESULTS: fig:gene-duplication-mechanisms
|
||||||
|
[[./figures/lallemand2020-fig1_copy.svg]]
|
||||||
|
|
||||||
|
# https://stackoverflow.com/questions/13611837/how-can-i-use-different-image-formats-for-different-exports-in-org-mode
|
||||||
|
|
||||||
Multiple mechanisms may lead to gene duplication. We review them in this section.
|
Multiple mechanisms may lead to gene duplication. We review them in this section.
|
||||||
|
|
||||||
|
@ -58,48 +74,51 @@ Multiple mechanisms may lead to gene duplication. We review them in this section
|
||||||
*** Retroduplication
|
*** Retroduplication
|
||||||
Retrotransposons, or RNA transposons are one type of transposable elements. Retrotransposons share similar structure and mechanism with retroviruses.
|
Retrotransposons, or RNA transposons are one type of transposable elements. Retrotransposons share similar structure and mechanism with retroviruses.
|
||||||
They may replicate in the genome through a mechanism known as "copy-and-paste".
|
They may replicate in the genome through a mechanism known as "copy-and-paste".
|
||||||
These transposons are typically composed of a reverse transcriptase gene. This enzyme gene may proceed in the reverse transcription of an mRNA transcript into DNA sequence which can then be inserted elsewhere in the genome.
|
These transposons are typically composed of a reverse transcriptase gene. This enzyme may proceed in the reverse transcription of an mRNA transcript into DNA sequence which can then be inserted elsewhere in the genome.
|
||||||
More generally, retroduplication refers to the duplication of a region in a chromosome through reverse transcription or a transcript.
|
More generally, retroduplication refers to the duplication of a region of a chromosome through reverse transcription of an RNA transcript.
|
||||||
*** Transduplication
|
*** Transduplication
|
||||||
DNA transposons are another type of transposable element whose transposition mechanism can also lead to gene duplication.
|
DNA transposons are another type of transposable element whose transposition mechanism can also lead to gene duplication.
|
||||||
This type of transposable element moves in the genome through a mechanisms known as "cut-and-paste".
|
This type of transposable element moves in the genome through a mechanisms known as "cut-and-paste".
|
||||||
A typical DNA transposon contains a transposase gene. This enzyme recognize two sites surrounding the donnor transposon sequence in the chromosome resulting in a DNA cleavage and excision of the transposon. The transposase can then insert the transposon in a new place of the genome.
|
A typical DNA transposon contains a transposase gene. This enzyme recognize two sites surrounding the donnor transposon sequence in the chromosome resulting in a DNA cleavage and excision of the transposon. The transposase can then insert the transposon in a new place of the genome.
|
||||||
Similarly to retrotransposon, if a gene was present between the two cleavage sites of the donnor transposon, it may move with the transposed sequence.
|
Similarly to retrotransposon, if a gene was present between the two cleavage sites of the donnor transposon, it may move with the transposed sequence.
|
||||||
*** Tandem Duplication
|
*** Tandem Duplication
|
||||||
*** Polyploidisation
|
*** Polyploidisation and Whole Genome Duplication
|
||||||
**** Alloployploidisation
|
In an event of whole genome duplication, the entire set of genes present on the chromosomes is duplicated.
|
||||||
**** Autopolyploidisation
|
Whole genome duplication is more frequent in plants.
|
||||||
**** Polyploidisation mechanisms
|
A striking example is probably the /Triticum/ genus (wheat) in which some species (such as /T. aestivum/) are hexaploid, due to hybridisation events [cite:@golovninaMolecularPhylogenyGenus2007].
|
||||||
***** Polyspermy
|
|
||||||
***** Non-reduced gametes
|
We distinguish two kinds of polyploidisation, based on the origin of the duplicate genome:
|
||||||
|
- Allopolyploidisation occurs when the supplementary chromosomes come from another species. This is the case for /Triticum aestivum/ hybridisation.
|
||||||
|
- Autopolyploidisation consists in the hybridisation of the genome within the same species.
|
||||||
|
|
||||||
|
Whole genome duplication can occur thanks to polyspermy or in case of a non-reduced gamete, for instance.
|
||||||
*** Unequal crossing-over
|
*** Unequal crossing-over
|
||||||
A crossing-over may occur during cell division. A fragment of chromosome is exchanged between two chromatids of a pair of chromosome. If the cleavage of the two chromatids occured at different positions on both chromosomes, the shared fragments may have different lengths. When the repair of missing fragment is performed, the resulting chromosome will incorporate a duplicate region of the chromosome, leading to a potential duplication for genes present in this region, as represented in figure [[fig:gene-duplication-mechanisms]].
|
A crossing-over may occur during cell division. A fragment of chromosome is exchanged between two chromatids of a pair of chromosome. If the cleavage of the two chromatids occured at different positions on both chromosomes, the shared fragments may have different lengths. When the repair of missing fragment is performed, the resulting chromosome will incorporate a duplicate region of the chromosome, leading to a potential duplication for genes present in this region, as represented in figure [[fig:gene-duplication-mechanisms]].
|
||||||
This mechanism leads to the duplication of the whole set of genes present in the inserted fragment. These genes are duplicated one after the other in second array of genes placed after the original one and are thus called Tandemly Arrayed Genes.
|
This mechanism leads to the duplication of the whole set of genes present in the inserted fragment. The duplicated genes form a second array placed right after the original one and are thus called Tandemly Arrayed Genes.
|
||||||
** Role of duplicate genes in genome evolution
|
** Role of duplicate genes in genome evolution
|
||||||
In his book /Evolution by Gene Duplication/, Susumu \textsc{Ohno} proposed that gene duplication plays a major role in species evolution [cite:@ohnoEvolutionGeneDuplication1970].
|
In his book /Evolution by Gene Duplication/, Susumu [[latex:textsc][Ohno]] proposed that gene duplication plays a major role in species evolution [cite:@ohnoEvolutionGeneDuplication1970].
|
||||||
|
|
||||||
** Methods to identify duplicate genes
|
** Methods to identify duplicate genes
|
||||||
\textsc{Lallemand} et al. review the different methods used to detect duplicate genes. These methods are dependant on the type of duplicate genes they target [cite:@lallemandOverviewDuplicatedGene2020].
|
[[latex:textsc][Lallemand]] et al. review the different methods used to detect duplicate genes. These methods are dependant on the type of duplicate genes they target [cite:@lallemandOverviewDuplicatedGene2020].
|
||||||
|
|
||||||
*** FTAG Finder
|
*** FTAG Finder
|
||||||
Developped in the LaMME laboratory, this pipeline targets the detection of gene family and tandemly arrayed genes from a given species' proteome [cite:@bouillonFTAGFinderOutil].
|
Developed in the LaMME laboratory, this pipeline targets the detection of gene families and tandemly arrayed genes from a given species' proteome [cite:@bouillonFTAGFinderOutil].
|
||||||
|
|
||||||
**** Estimation of homology links between genes
|
**** Estimation of homology links between genes
|
||||||
This steps consists in establishing a relation between each genes in a genome.
|
This steps consists in establishing a relation between each genes in a genome.
|
||||||
In this step, the typical tool involved is =BLAST= (Basic Local Alignment Search Tool) [cite:@altschulBasicLocalAlignment1990] run on the whole proteome.
|
In this step, the typical tool involved is =BLAST= (Basic Local Alignment Search Tool) [cite:@altschulBasicLocalAlignment1990] run on the whole proteome.
|
||||||
|
|
||||||
Several =BLAST= metrics can be used as an homology measure, such as bitscore, identity percentage, E-value or modifications of thoses. The choice of the metrics used may have an impact on the results of graph clustering step [cite:@gibbonsEvaluationBLASTbasedEdgeweighting2015].
|
Several =BLAST= metrics can be used as a homology measure, such as bitscore, identity percentage, E-value or variations on those. The choice of metric may have an impact on the results of graph clustering in the following step [cite:@gibbonsEvaluationBLASTbasedEdgeweighting2015].
|
||||||
**** Identification of gene families
|
**** Identification of gene families
|
||||||
Based on the homology links between each pair of genes, we construct a weighted undirected graph whose vertices corresponds to genes and edges to homology links.
|
Based on the homology links between each pair of genes, we construct a weighted undirected graph whose vertices corresponds to genes and edges to homology links.
|
||||||
Then, a graph clustering algorithm is applied on this graph in order to infer the gene families.
|
Then, a graph clustering algorithm is applied on this graph in order to infer the gene families.
|
||||||
|
|
||||||
The team choosed to propose three clustering algorithms: Single linkage, Markov Clustering or Walktrap.
|
The team chose to propose three clustering algorithms: Single linkage, Markov Clustering or Walktrap.
|
||||||
|
|
||||||
* Objectives
|
* Objectives
|
||||||
** Extend the existing Galaxy pipeline
|
** Extend the existing Galaxy pipeline
|
||||||
Galaxy is a web-based platform for performing accessible data analysis pipeline, mostly used for genomic data analysis [cite:@goecksGalaxyComprehensiveApproach2010].
|
Galaxy is a web-based platform for running accessible data analysis pipelines, first designed for use in genomic data analysis [cite:@goecksGalaxyComprehensiveApproach2010].
|
||||||
|
|
||||||
Last year, Séanna \textsc{Charles}, worked on the Galaxy's version of the gls:FTAG Finder pipeline [cite:@charlesFinalisationPipelineFTAG2023] during her M1 intenship. I will continue this work.
|
Last year, Séanna [[latex:textsc][Charles]] worked on the Galaxy version of the gls:FTAG Finder pipeline during her M1 internship [cite:@charlesFinalisationPipelineFTAG2023]. I will continue this work.
|
||||||
|
|
||||||
** Port FTAG Finder pipeline on a workflow manager
|
** Port FTAG Finder pipeline on a workflow manager
|
||||||
Another objective of my internship will be to port FTAG Finder on a workflow manager better suited to larger and more reproducible analysis.
|
Another objective of my internship will be to port FTAG Finder on a workflow manager better suited to larger and more reproducible analysis.
|
||||||
|
@ -109,10 +128,15 @@ The two main options are Snakemake and Nextflow. Snakemake is a python powered w
|
||||||
|
|
||||||
These tools ease the deployment of large scale data analysis workflow with reproducible output.
|
These tools ease the deployment of large scale data analysis workflow with reproducible output.
|
||||||
|
|
||||||
#+begin_export latex
|
#+begin_export html
|
||||||
\printbibliography
|
<h3>Bibliography</h3>
|
||||||
#+end_export
|
#+end_export
|
||||||
|
|
||||||
|
#+print_bibliography:
|
||||||
|
|
||||||
|
#+begin_export latex
|
||||||
|
\clearpage
|
||||||
|
#+end_export
|
||||||
** Summary
|
** Summary
|
||||||
:PROPERTIES:
|
:PROPERTIES:
|
||||||
:UNNUMBERED: t
|
:UNNUMBERED: t
|
||||||
|
@ -120,7 +144,7 @@ These tools ease the deployment of large scale data analysis workflow with repro
|
||||||
|
|
||||||
|
|
||||||
* Bean :noexport:
|
* Bean :noexport:
|
||||||
|
** MCL
|
||||||
MCL uses two operations on a stochastic matrix representation $M$ of the graph first derived from the adjacency matrix, namely /expansion/ and /inflation/. Expansion consists in elevating the matrix to a power $r$, and subsequently scaling its columns so that they sum to 1 again. The image of the inflation operator $\Gamma_r$ is defined as
|
MCL uses two operations on a stochastic matrix representation $M$ of the graph first derived from the adjacency matrix, namely /expansion/ and /inflation/. Expansion consists in elevating the matrix to a power $r$, and subsequently scaling its columns so that they sum to 1 again. The image of the inflation operator $\Gamma_r$ is defined as
|
||||||
\[
|
\[
|
||||||
(\Gamma_r M)_{pq} = (M_{pq})^r / \sum_{i=1}^m (M_{iq})^r
|
(\Gamma_r M)_{pq} = (M_{pq})^r / \sum_{i=1}^m (M_{iq})^r
|
||||||
|
|
BIN
report.pdf (Stored with Git LFS)
BIN
report.pdf (Stored with Git LFS)
Binary file not shown.
Loading…
Reference in New Issue