feat: Adding some text on duplication mechanisms

This commit is contained in:
Samuel Ortion 2024-03-26 15:16:00 +01:00
parent e16913e3d7
commit 61c504ec61
15 changed files with 622 additions and 35 deletions

1
.gitattributes vendored
View File

@ -1 +1,2 @@
main.pdf filter=lfs diff=lfs merge=lfs -text
*.pdf filter=lfs diff=lfs merge=lfs -text

View File

@ -1,6 +1,5 @@
OPTIONS=-shell-escape -file-line-error -synctex=1
SOURCE=main
SOURCE=report
all: latexmk bib glossaries latexmk
build:

BIN
figures/lallemand2020-fig1_copy.pdf (Stored with Git LFS) Normal file

Binary file not shown.

View File

@ -0,0 +1,438 @@
<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!-- Created with Inkscape (http://www.inkscape.org/) -->
<svg
width="210mm"
height="297mm"
viewBox="0 0 210 297"
version="1.1"
id="svg1"
inkscape:version="1.3.2 (091e20ef0f, 2023-11-25)"
sodipodi:docname="lallemand2020-fig1_copy.svg"
inkscape:export-filename="lallemand2020-fig1_copy.pdf"
inkscape:export-xdpi="96"
inkscape:export-ydpi="96"
xmlns:inkscape="http://www.inkscape.org/namespaces/inkscape"
xmlns:sodipodi="http://sodipodi.sourceforge.net/DTD/sodipodi-0.dtd"
xmlns="http://www.w3.org/2000/svg"
xmlns:svg="http://www.w3.org/2000/svg">
<sodipodi:namedview
id="namedview1"
pagecolor="#ffffff"
bordercolor="#000000"
borderopacity="0.25"
inkscape:showpageshadow="2"
inkscape:pageopacity="0.0"
inkscape:pagecheckerboard="0"
inkscape:deskcolor="#d1d1d1"
inkscape:document-units="mm"
showgrid="true"
inkscape:zoom="1.0356019"
inkscape:cx="479.43132"
inkscape:cy="362.10825"
inkscape:window-width="1920"
inkscape:window-height="1008"
inkscape:window-x="0"
inkscape:window-y="0"
inkscape:window-maximized="1"
inkscape:current-layer="g40">
<inkscape:grid
id="grid2"
units="mm"
originx="0"
originy="0"
spacingx="0.99999998"
spacingy="1"
empcolor="#0099e5"
empopacity="0.30196078"
color="#0099e5"
opacity="0.14901961"
empspacing="5"
dotted="false"
gridanglex="30"
gridanglez="30"
visible="true" />
</sodipodi:namedview>
<defs
id="defs1">
<!-- Arrowhead marker. It is referenced through marker-end by the two arrow
     paths of this drawing (path23 and path24). Its shape is painted with
     context-stroke for both fill and stroke, i.e. it takes the stroke paint
     of the path that references it. orient="auto-start-reverse" aligns the
     arrowhead with the direction of the referencing path.
     NOTE(review): context-stroke is an SVG 2 feature; confirm that the
     SVG-to-PDF export used for the report renders it as intended. -->
<marker
style="overflow:visible"
id="ArrowTriangleStylized"
refX="0"
refY="0"
orient="auto-start-reverse"
inkscape:stockid="Stylized triangle arrow"
markerWidth="1"
markerHeight="1"
viewBox="0 0 1 1"
inkscape:isstock="true"
inkscape:collect="always"
preserveAspectRatio="xMidYMid">
<path
transform="scale(0.5)"
style="fill:context-stroke;fill-rule:evenodd;stroke:context-stroke;stroke-width:1pt"
d="m 6,0 c -3,1 -7,3 -9,5 0,0 0,-4 2,-5 -2,-1 -2,-5 -2,-5 2,2 6,4 9,5 z"
id="path4" />
</marker>
</defs>
<g
inkscape:label="Layer 1"
inkscape:groupmode="layer"
id="layer1">
<text
xml:space="preserve"
style="font-size:4.23333px;font-family:'Latin Modern Roman';-inkscape-font-specification:'Latin Modern Roman, Normal';fill:none;fill-opacity:0.913725;stroke:#cccccc;stroke-width:1"
x="21.964703"
y="25"
id="text1"><tspan
sodipodi:role="line"
id="tspan1"
style="fill:#000000;stroke:none;stroke-width:1"
x="21.964703"
y="25">A</tspan></text>
<g
id="g7"
transform="translate(8.6387193,3.9999999)"
style="stroke:#0000ff">
<circle
style="fill:none;fill-opacity:0.913725;stroke:#000000;stroke-width:1;stroke-dasharray:none"
id="path2"
cx="53.232861"
cy="35.984467"
r="14.015532"
transform="translate(-8.6387193,-3.9999999)" />
<g
id="g4"
style="stroke:#0000ff"
transform="translate(-11.149481,-3.9999999)">
<path
style="fill:none;fill-opacity:0.913725;stroke:#0000ff;stroke-width:1;stroke-dasharray:none"
d="m 46.626465,29.999998 c 0.230253,1.609669 0.884298,5.000001 0.884298,5.000001 0,0 -0.617872,3.263792 -0.884298,5"
id="path3"
sodipodi:nodetypes="ccc" />
<path
style="fill:none;fill-opacity:0.913725;stroke:#0000ff;stroke-width:1;stroke-dasharray:none"
d="m 49.000001,29.999999 -0.638719,5 L 49.000001,40"
id="path3-1"
sodipodi:nodetypes="ccc" />
</g>
<g
id="g4-6"
style="stroke:#0000ff"
transform="translate(-6.7900835,-4.0025177)">
<path
style="fill:none;fill-opacity:0.913725;stroke:#0000ff;stroke-width:1;stroke-dasharray:none"
d="m 46.626465,29.999998 c 0.230253,1.609669 0.884298,5.000001 0.884298,5.000001 0,0 -0.617872,3.263792 -0.884298,5"
id="path3-5"
sodipodi:nodetypes="ccc" />
<path
style="fill:none;fill-opacity:0.913725;stroke:#0000ff;stroke-width:1;stroke-dasharray:none"
d="m 49.000001,29.999999 -0.638719,5 L 49.000001,40"
id="path3-1-6"
sodipodi:nodetypes="ccc" />
</g>
<g
id="g5"
style="stroke:#ff6600">
<path
style="fill:none;fill-opacity:0.913725;stroke:#ff6600;stroke-width:1;stroke-dasharray:none"
d="m 47.169376,32.256753 c 0.230253,1.609669 0.341387,2.743246 0.341387,2.743246 0,0 -0.266577,1.826675 -0.533003,3.562883"
id="path3-5-3"
sodipodi:nodetypes="ccc" />
<path
style="fill:none;fill-opacity:0.913725;stroke:#ff6600;stroke-width:1;stroke-dasharray:none"
d="m 48.936129,32.363258 -0.574847,2.636741 0.606783,3.638722"
id="path3-1-6-8"
sodipodi:nodetypes="ccc" />
</g>
<g
id="g6"
transform="translate(3.6966086,0.18063894)"
style="stroke:#ff6600">
<path
style="fill:none;fill-opacity:0.913725;stroke:#ff6600;stroke-width:1;stroke-dasharray:none"
d="m 47.169376,32.256753 c 0.230253,1.609669 0.341387,2.743246 0.341387,2.743246 0,0 -0.266577,1.826675 -0.533003,3.562883"
id="path5"
sodipodi:nodetypes="ccc" />
<path
style="fill:none;fill-opacity:0.913725;stroke:#ff6600;stroke-width:1;stroke-dasharray:none"
d="m 48.936129,32.363258 -0.574847,2.636741 0.606783,3.638722"
id="path6"
sodipodi:nodetypes="ccc" />
</g>
</g>
<g
id="g15"
transform="translate(80.405862,4.0000004)"
style="stroke:#0000ff">
<g
id="g23"
transform="translate(17.616381,0.32044963)">
<circle
style="fill:none;fill-opacity:0.913725;stroke:#000000;stroke-width:1;stroke-dasharray:none"
id="circle7"
cx="53.232861"
cy="35.984467"
r="14.015532"
transform="translate(-8.6387193,-3.9999999)" />
<g
id="g8"
style="stroke:#0000ff"
transform="translate(-9.5619803,-8.2333335)">
<path
style="fill:none;fill-opacity:0.913725;stroke:#0000ff;stroke-width:1;stroke-dasharray:none"
d="m 46.626465,29.999998 c 0.230253,1.609669 0.884298,5.000001 0.884298,5.000001 0,0 -0.617872,3.263792 -0.884298,5"
id="path7"
sodipodi:nodetypes="ccc" />
<path
style="fill:none;fill-opacity:0.913725;stroke:#0000ff;stroke-width:1;stroke-dasharray:none"
d="m 49.000001,29.999999 -0.638719,5 L 49.000001,40"
id="path8"
sodipodi:nodetypes="ccc" />
</g>
<g
id="g10"
style="stroke:#0000ff"
transform="translate(-5.2025834,-8.2358513)">
<path
style="fill:none;fill-opacity:0.913725;stroke:#0000ff;stroke-width:1;stroke-dasharray:none"
d="m 46.626465,29.999998 c 0.230253,1.609669 0.884298,5.000001 0.884298,5.000001 0,0 -0.617872,3.263792 -0.884298,5"
id="path9"
sodipodi:nodetypes="ccc" />
<path
style="fill:none;fill-opacity:0.913725;stroke:#0000ff;stroke-width:1;stroke-dasharray:none"
d="m 49.000001,29.999999 -0.638719,5 L 49.000001,40"
id="path10"
sodipodi:nodetypes="ccc" />
</g>
<g
id="g12"
style="stroke:#ff9f00;stroke-opacity:1"
transform="translate(0,2.1166667)">
<path
style="fill:none;fill-opacity:0.913725;stroke:#ff9f00;stroke-width:1;stroke-dasharray:none;stroke-opacity:1"
d="m 47.169376,32.256753 c 0.230253,1.609669 0.341387,2.743246 0.341387,2.743246 0,0 -0.266577,1.826675 -0.533003,3.562883"
id="path11"
sodipodi:nodetypes="ccc" />
<path
style="fill:none;fill-opacity:0.913725;stroke:#ff9f00;stroke-width:1;stroke-dasharray:none;stroke-opacity:1"
d="m 48.936129,32.363258 -0.574847,2.636741 0.606783,3.638722"
id="path12"
sodipodi:nodetypes="ccc" />
</g>
<g
id="g14"
transform="translate(3.6966086,2.2973057)"
style="stroke:#ff9f00;stroke-opacity:1">
<path
style="fill:none;fill-opacity:0.913725;stroke:#ff9f00;stroke-width:1;stroke-dasharray:none;stroke-opacity:1"
d="m 47.169376,32.256753 c 0.230253,1.609669 0.341387,2.743246 0.341387,2.743246 0,0 -0.266577,1.826675 -0.533003,3.562883"
id="path13"
sodipodi:nodetypes="ccc" />
<path
style="fill:none;fill-opacity:0.913725;stroke:#ff9f00;stroke-width:1;stroke-dasharray:none;stroke-opacity:1"
d="m 48.936129,32.363258 -0.574847,2.636741 0.606783,3.638722"
id="path14"
sodipodi:nodetypes="ccc" />
</g>
<g
id="g16"
style="stroke:#008eff;stroke-opacity:1"
transform="translate(-9.5619803,2.879167)">
<path
style="fill:none;fill-opacity:0.913725;stroke:#008eff;stroke-width:1;stroke-dasharray:none;stroke-opacity:1"
d="m 46.626465,29.999998 c 0.230253,1.609669 0.884298,5.000001 0.884298,5.000001 0,0 -0.617872,3.263792 -0.884298,5"
id="path15"
sodipodi:nodetypes="ccc" />
<path
style="fill:none;fill-opacity:0.913725;stroke:#008eff;stroke-width:1;stroke-dasharray:none;stroke-opacity:1"
d="m 49.000001,29.999999 -0.638719,5 L 49.000001,40"
id="path16"
sodipodi:nodetypes="ccc" />
</g>
<g
id="g18"
style="stroke:#008eff;stroke-opacity:1"
transform="translate(-5.2025834,2.8766492)">
<path
style="fill:none;fill-opacity:0.913725;stroke:#008eff;stroke-width:1;stroke-dasharray:none;stroke-opacity:1"
d="m 46.626465,29.999998 c 0.230253,1.609669 0.884298,5.000001 0.884298,5.000001 0,0 -0.617872,3.263792 -0.884298,5"
id="path17"
sodipodi:nodetypes="ccc" />
<path
style="fill:none;fill-opacity:0.913725;stroke:#008eff;stroke-width:1;stroke-dasharray:none;stroke-opacity:1"
d="m 49.000001,29.999999 -0.638719,5 L 49.000001,40"
id="path18"
sodipodi:nodetypes="ccc" />
</g>
<g
id="g20"
style="stroke:#ff6600"
transform="translate(0,-8.4666671)">
<path
style="fill:none;fill-opacity:0.913725;stroke:#ff6600;stroke-width:1;stroke-dasharray:none"
d="m 47.169376,32.256753 c 0.230253,1.609669 0.341387,2.743246 0.341387,2.743246 0,0 -0.266577,1.826675 -0.533003,3.562883"
id="path19"
sodipodi:nodetypes="ccc" />
<path
style="fill:none;fill-opacity:0.913725;stroke:#ff6600;stroke-width:1;stroke-dasharray:none"
d="m 48.936129,32.363258 -0.574847,2.636741 0.606783,3.638722"
id="path20"
sodipodi:nodetypes="ccc" />
</g>
<g
id="g22"
transform="translate(3.6966086,-8.2860282)"
style="stroke:#ff6600">
<path
style="fill:none;fill-opacity:0.913725;stroke:#ff6600;stroke-width:1;stroke-dasharray:none"
d="m 47.169376,32.256753 c 0.230253,1.609669 0.341387,2.743246 0.341387,2.743246 0,0 -0.266577,1.826675 -0.533003,3.562883"
id="path21"
sodipodi:nodetypes="ccc" />
<path
style="fill:none;fill-opacity:0.913725;stroke:#ff6600;stroke-width:1;stroke-dasharray:none"
d="m 48.936129,32.363258 -0.574847,2.636741 0.606783,3.638722"
id="path22"
sodipodi:nodetypes="ccc" />
</g>
</g>
<path
style="fill:none;fill-opacity:0.913725;stroke:#000000;stroke-width:1;stroke-dasharray:none;stroke-opacity:1;marker-end:url(#ArrowTriangleStylized)"
d="m 4.5617219,30.997399 25.0324191,0.0026"
id="path23" />
<text
xml:space="preserve"
style="font-size:4.23333px;font-family:'Latin Modern Roman';-inkscape-font-specification:'Latin Modern Roman, Normal';fill:none;fill-opacity:0.913725;stroke:#000000;stroke-width:1;stroke-dasharray:none;stroke-opacity:1"
x="-5.320653"
y="25.072666"
id="text23"><tspan
sodipodi:role="line"
id="tspan23"
style="fill:#000000;stroke:none;stroke-width:1"
x="-5.320653"
y="25.072666">whole genome duplication</tspan></text>
<path
style="fill:none;fill-opacity:0.913725;stroke:#000000;stroke-width:1;stroke-dasharray:none;stroke-opacity:1;marker-end:url(#ArrowTriangleStylized)"
d="m 4.8701727,100.96179 25.0324193,0.003"
id="path24" />
</g>
<text
xml:space="preserve"
style="font-size:4.23333px;font-family:'Latin Modern Roman';-inkscape-font-specification:'Latin Modern Roman, Normal';fill:#000000;fill-opacity:0.913725;stroke-width:1"
x="20"
y="65"
id="text2"><tspan
sodipodi:role="line"
id="tspan2"
style="stroke-width:1"
x="20"
y="65">B</tspan></text>
<text
xml:space="preserve"
style="font-size:4.23333px;font-family:'Latin Modern Roman';-inkscape-font-specification:'Latin Modern Roman, Normal';fill:#000000;fill-opacity:0.913725;stroke-width:1"
x="80.6063"
y="99.027908"
id="text3"><tspan
sodipodi:role="line"
id="tspan3"
style="stroke-width:1"
x="80.6063"
y="99.027908">unequal crossing-over</tspan></text>
<path
style="fill:none;fill-opacity:0.913725;stroke:#ffaaaa;stroke-width:1"
d="m 44.960266,113.25722 0.03973,8.74277"
id="path36" />
<path
style="fill:none;fill-opacity:0.913725;stroke:#0000ff;stroke-width:1"
d="m 44.868446,93.051087 0.09182,20.206133"
id="path25" />
<path
style="fill:none;fill-opacity:0.913725;stroke:#ffaaaa;stroke-width:1"
d="m 54.866979,113.92631 0.01262,8.07595"
id="path32"
sodipodi:nodetypes="cc" />
<path
style="fill:none;fill-opacity:0.913725;stroke:#0000ff;stroke-width:1"
d="m 50.000001,92.999997 v 4 c 1e-6,9.000003 5.188809,4.505713 4.866978,16.926313"
id="path26"
sodipodi:nodetypes="csc" />
<path
style="fill:none;fill-opacity:0.913725;stroke:#ff0000;stroke-width:1"
d="m 51.002359,106.37341 c -0.500431,1.23589 -0.794678,3.15897 -0.682998,7.26333"
id="path33" />
<path
style="fill:none;fill-opacity:0.913725;stroke:#0000ff;stroke-width:1"
d="m 54.922619,84.055247 -0.273915,12.94475 c -1.07215,7.153293 -2.715748,7.075173 -3.646345,9.373413"
id="path27" />
<path
style="fill:none;fill-opacity:0.913725;stroke:#ff0000;stroke-width:1"
d="m 60.053664,104.08938 -0.10732,7.82124"
id="path29"
sodipodi:nodetypes="cc" />
<path
style="fill:none;fill-opacity:0.913725;stroke:#0000ff;stroke-width:1"
d="m 60.214294,84.055247 -0.16063,20.034133"
id="path28"
sodipodi:nodetypes="cc" />
<g
id="g40"
transform="translate(-15.287297,-0.01996951)">
<path
style="fill:none;fill-opacity:0.913725;stroke:#ffaaaa;stroke-width:1"
d="m 145.33224,111.9049 0.0417,9.17903"
id="path37" />
<path
style="fill:none;fill-opacity:0.913725;stroke:#0000ff;stroke-width:1"
d="m 145.2424,92.135035 0.0898,19.769865"
id="path38" />
<path
style="fill:none;fill-opacity:0.913725;stroke:#ffaaaa;stroke-width:1;stroke-dasharray:1, 1;stroke-dashoffset:0"
d="m 150.00669,111.9049 0.0417,9.17903"
id="path46" />
</g>
<g
id="g41"
transform="translate(-15.297386,-0.0183055)">
<path
style="fill:none;fill-opacity:0.913725;stroke:#ff0000;stroke-width:1"
d="m 150.00494,101.6855 0.002,10.2194"
id="path39"
sodipodi:nodetypes="cc" />
<path
style="fill:none;fill-opacity:0.913725;stroke:#0000ff;stroke-width:1"
d="m 150.00493,92.135035 1e-5,9.550465"
id="path40"
sodipodi:nodetypes="cc" />
</g>
<!-- Group g42: three stroke-only line segments, shifted by the group transform.
     path42 is a blue segment, path41 a light-red segment that starts where
     path42 ends, and path45 a dashed light-red segment drawn next to path41.
     All of them are open two-point paths, so they are painted with fill:none
     like every other line segment in this layer. -->
<g
   id="g42"
   transform="translate(8.7127035,-0.01997038)">
  <path
     style="fill:none;fill-opacity:0.913725;stroke:#ffaaaa;stroke-width:1"
     d="m 145.33224,123.01747 0.0417,9.17903"
     id="path41" />
  <path
     style="fill:none;fill-opacity:0.913725;stroke:#0000ff;stroke-width:1"
     d="m 145.2424,92.135035 0.0898,30.882435"
     id="path42"
     sodipodi:nodetypes="cc" />
  <path
     style="fill:none;fill-opacity:0.913725;stroke:#ffaaaa;stroke-width:1;stroke-dasharray:1,1;stroke-dashoffset:0"
     d="m 150.09477,123.01747 0.0417,9.17903"
     id="path45" />
</g>
<g
id="g44"
transform="translate(8.7127035,-0.01997038)">
<path
style="fill:none;fill-opacity:0.913725;stroke:#ff0000;stroke-width:1"
d="m 150.09129,113.25497 0.0452,9.94564"
id="path43" />
<path
style="fill:none;fill-opacity:0.913725;stroke:#0000ff;stroke-width:1"
d="m 150.00493,92.135035 0.0864,21.119935"
id="path44"
sodipodi:nodetypes="cc" />
</g>
</g>
</svg>

After

Width:  |  Height:  |  Size: 18 KiB

View File

@ -1 +0,0 @@
\newabbreviation{TAG}{TAGs}{Tandem Arrayed Genes}

BIN
main.pdf (Stored with Git LFS)

Binary file not shown.

Binary file not shown.

Binary file not shown.

Binary file not shown.

View File

@ -1,44 +1,92 @@
#+title: Further development on FTAG Finder, a pipeline to identify Tandem Arrayed Genes
#+subtitle: Scientific project
#+title: Further development on Finder, a pipeline to identify Tandem Arrayed Genes
#+author: Samuel Ortion
#+date: 2023-2024
#+LATEX_CLASS: lamme2024
#+LATEX_CLASS: scientific-project
#+LATEX_HEADER: \usepackage{sty/lamme2024}
#+latex_header_extra: \newglossaryentry{LaMME}{name={LaMME},description={Laboratoire de Mathématiques et Modélisation d'Évry}}
#+bibliography: ../references.bib
#+exclude_tags: noexport
#+options: H:7
#+options: toc:nil
# ref. https://write.as/dani/writing-a-phd-thesis-with-org-mode
#+name: acronyms
| key | abbreviation | full form |
|-----+--------------+---------------------|
| TAG | TAG | Tandem Arrayed Gene |
| FTAG | FTAG | Families and Tandem Arrayed Gene |
#+begin_export latex
\hypersetup{
pdfauthor={Samuel Ortion},
pdftitle={},
pdfkeywords={duplicate genes, workflow management systems, pipeline},
pdfsubject={},
pdflang={English}}
{
\pagenumbering{roman}
\hypersetup{hidelinks}
\tableofcontents
\printglossaries
}
\pagenumbering{roman}
#+end_export
#+begin_abstract
Duplicate genes are an important component of genomes. They have a particular role in genome evolution, allowing species to explore new gene functionality by offering a pool of usable genes to build on.
TODO:
#+end_abstract
#+begin_center
duplicate genes, tandem arrayed genes, pipeline
*keywords*: duplicate genes, tandem arrayed genes, pipeline
#+end_center
#+begin_export latex
\tableofcontents
#+end_export
[[printglossaries:]]
#+begin_export latex
\pagenumbering{arabic}
#+end_export
* Context
** Duplicate genes
*** Duplication mechanism
** What are duplicate genes?
Duplicate genes are genes that experienced a duplication event during species evolution.
These are homologous genes.
*** Duplication mechanisms
#+name: fig:gene-duplication-mechanisms
#+CAPTION: Mechanisms leading to gene duplication
[[./figures/lallemand2020-fig1_copy.pdf]]
Several mechanisms may lead to gene duplication. We review them in this section.
**** Segment duplication
**** Retroduplication
Transposable elements cause an important part of gene duplications [citation needed].
Retrotransposons, or RNA transposons, are one type of transposable element. Some retrotransposons are similar to retroviruses.
Retrotransposons may be duplicated in the genome through a mechanism known as "copy-and-paste".
These transposons typically contain a reverse transcriptase gene. The protein encoded by this gene may reverse-transcribe the RNA transcript of the transposon sequence, resulting in a DNA sequence which can then be inserted elsewhere in the genome.
During this process, the RNA transcript may include a nearby gene sequence, which can thus be copied and pasted along with the retrotransposon.
**** Transduplication
DNA transposons are another type of transposable element whose transposition mechanism can also lead to gene duplication.
This type of transposable element moves in the genome through a mechanism known as "cut-and-paste".
The typical DNA transposon contains a transposase gene. The protein encoded by this gene recognizes two sites surrounding the donor transposon sequence in the chromosome, resulting in a DNA cleavage. The transposase can then insert the transposon in a new place of the genome.
As with retrotransposons, if a gene is present between the two cleavage sites of the donor transposon, it may move with the transposed sequence.
**** Tandem Duplication
**** Polyploidisation
***** Allopolyploidisation
***** Autopolyploidisation
***** Mechanisms
****** Polyspermy
****** Non-reduced gametes
**** Unequal crossing-over
A crossing-over may occur during cell division. A fragment of chromosome is exchanged between two chromatids of a pair of chromosomes. If the cleavage of the two chromatids occurred at different positions on the two chromosomes, the exchanged fragments may have different lengths. When the missing fragment is repaired, the resulting chromosome will incorporate a duplicated region of the chromosome, leading to a potential duplication of the genes present in this region, as represented in figure [[fig:gene-duplication-mechanisms]] B.
# TODO: check that this is really the B subfigure
*** Role in genome evolution
** Identification of duplicate genes
** FTAG Finder, a method to identify Families and Tandem Arrayed Genes
*** Finder
* Objectives
** Amend the existing Galaxy pipeline
Last year, an M1 student, Seanna Charles, worked on the Galaxy version of the gls:FTAG Finder pipeline [cite:@charlesFinalisationPipelineFTAG2023].
During my internship, I will continue this work.
** Porting Finder pipeline on a workflow manager
* Tips :noexport:
To export:
C-c C-e C-b l l
#+begin_export latex
\printbibliography
#+end_export

Binary file not shown.

View File

@ -1,14 +1,21 @@
% Created 2024-03-21 Thu 19:34
% Created 2024-03-26 Tue 15:13
% Intended LaTeX compiler: lualatex
\documentclass{scrreprt}
\usepackage{sty/lamme2024}
\documentclass{scrbook}
\usepackage{sty/lamme2024}
\newacronym{TAG}{TAG}{Tandem Arrayed Gene}
\newacronym{FTAG}{FTAG}{Families and Tandem Arrayed Gene}
\newglossaryentry{LaMME}{name={LaMME},description={Laboratoire de Mathématiques et Modélisation d'Évry}}
\makeindex
\makeglossaries
\usepackage{minted}
\author{Samuel Ortion}
\date{2023-2024}
\title{Further development on FTAG Finder, a pipeline to identify Tandem Arrayed Genes\\\medskip
\large Scientific project}
\title{Further development on Finder, a pipeline to identify Tandem Arrayed Genes}
\hypersetup{
pdfauthor={Samuel Ortion},
pdftitle={Further development on FTAG Finder, a pipeline to identify Tandem Arrayed Genes},
pdftitle={Further development on Finder, a pipeline to identify Tandem Arrayed Genes},
pdfkeywords={},
pdfsubject={},
pdfcreator={Emacs 29.2 (Org mode 9.7)},
@ -18,6 +25,87 @@
\begin{document}
\maketitle
\hypersetup{
pdfauthor={Samuel Ortion},
pdftitle={},
pdfkeywords={duplicate genes, workflow management systems, pipeline},
}
\pagenumbering{roman}
\begin{abstract}
Duplicate genes is an important component of genomes. They have a particular role in genome evolution, allowing species to explore new gene functionality offering a pool of usable genes to build on.
TODO:
\end{abstract}
\begin{center}
\textbf{keywords}: duplicate genes, tandem arrayed genes, pipeline
\end{center}
\tableofcontents
\printglossaries
\pagenumbering{arabic}
\part{Context}
\label{sec:org8d0fa24}
\chapter{What are duplicate genes?}
\label{sec:orgee68751}
Duplicate genes are genes that experienced a duplication event during species evolution.
These are homologous genes.
\section{Duplication mechanisms}
\label{sec:orgcf44cad}
\begin{center}
\includegraphics[width=.9\linewidth]{./figures/lallemand2020-fig1_copy.pdf}
\caption{\label{fig:gene-duplication-mechanisms}Mechanisms leading to gene duplication}
\end{center}
Several mechanisms may lead to gene duplication. We review them in this section.
\subsection{Segment duplication}
\label{sec:org922a1dd}
\subsection{Retroduplication}
\label{sec:orgd8f7e18}
Transposable elements cause an important part of gene duplication [citation needed]
Retrotransposon, or RNA transposon is one type of transposable element. Some of the representant of retrotransposon are similar to retroviruses.
Retrotransposon may be duplicated in the genome through a mechanism known as ``copy-and-paste''.
These transposons are typically composed of a reverse transcriptase gene. The protein encoded by this gene may proceed in the reverse transcription of the RNA transcript of the transposon sequence resulting in a DNA sequence which can then be included elsewhere in the genome.
During this process, the RNA transcript may include nearby gene sequence, which can thus be copied and pasted along with the retrotransposon.
\subsection{Transduplication}
\label{sec:org74a527a}
DNA transposon is an other type of transposable element whose transposition mechanisms can lead to gene duplication too.
This type of transposable element moves in the genome through a mechanisms known as ``cut-and-paste''.
The typical DNA transposon contains a transposase gene. The protein encoded by this gene recognize two sites surrounding the donnor transposon sequence in the chromosome resulting in a DNA cleavage. The transposase can then insert the transposon in a new place of the genome.
Similarly to retrotransposon, if a gene was present between the two cleavage sites of the donnor transposon, it may move with the transposed sequence.
\subsection{Tandem Duplication}
\label{sec:org1185c12}
\subsection{Polyploidisation}
\label{sec:org349eaa4}
\subsubsection{Alloployploïdisation}
\label{sec:org323512f}
\subsubsection{Autopolyploïdisation}
\label{sec:orgba5b73e}
\subsubsection{Mechanisms}
\label{sec:orga1009de}
\paragraph{Polyspermy}
\label{sec:orgee32a5c}
\paragraph{Non-reduced gametes}
\label{sec:org3297de6}
\subsection{Unequal crossing-over}
\label{sec:org31e5f76}
A crossing-over may occur during cell division. A fragment of chromosome is exchanged between two chromatids of a pair of chromosome. If the cleavage of the two chromatids occured at different positions on both chromosomes, the shared fragments may have different lengths. When the repair of missing fragment is performed, the resulting chromosome will incorporate a duplicate region of the chromosome, leading to a potential duplication for genes present in this region, as represented in figure \ref{fig:gene-duplication-mechanisms} B. \# TODO: check that this is really the B subfigure
\section{Role in genome evolution}
\label{sec:orga7bdfd9}
\chapter{Identification of duplicate genes}
\label{sec:org3aec87b}
\textbf{*}
\section{Finder}
\label{sec:org9b93040}
\part{Objectives}
\label{sec:org1b30340}
\chapter{Amend the existing Galaxy pipeline}
\label{sec:orgf108b0f}
Last year, a M1 student, Seanna Charles, worked on the Galaxy's version of the gls: Finder pipeline \autocite{charlesFinalisationPipelineFTAG2023}.
During my internship, I will continue this work.
\chapter{Porting Finder pipeline on a workflow manager}
\label{sec:orgd5c8063}
\printbibliography
\end{document}

View File

@ -65,3 +65,16 @@
\makeglossaries
\makeindex
\renewcommand\maketitle{\include{titlepage}}
% Abstract
\providecommand{\abstractname}{Abstract} % not in scrbook class
% abstract environment (the scrbook class does not provide one).
%
% Usage:  \begin{abstract} ... \end{abstract}
%
% Typesets a horizontal rule, the bold label "\abstractname: ", the body in
% small italics, and a closing rule followed by 0.6cm of vertical space.
%
% The environment takes NO argument. A mandatory argument would silently
% swallow the first token of the body (the first letter, or a command such as
% \gls), which breaks as soon as the abstract starts with a macro.
% A body wrapped in braces, \begin{abstract}{...}, still typesets correctly:
% the braces simply form a group inside the italic body.
\newenvironment{abstract}{%
  \hrule
  % Font changes stay local to the environment group.
  \small\textbf{\abstractname: }%
  \itshape
}{%
  % End the paragraph explicitly: \newline raises "There's no line here to
  % end" when the body already finished in vertical mode (e.g. a blank line
  % before \end{abstract}).
  \par\medskip
  \hrule
  \vspace{0.6cm}%
}

Binary file not shown.

View File

@ -13,13 +13,14 @@
\vfill
\Large Samuel ORTION \orcidlink{0009-0001-0971-497X}
\Large Samuel ORTION \orcidlink{0009-0001-0971-497X}
\vfill
\LARGE
Development of a Nextflow\footnote{We still need to decide which workflow manager to choose: Nextflow or Snakemake} pipeline for FTAG Finder, a duplicate gene detection tool, and improvement of the existing Galaxy implementation
\makeatletter
\@title
\makeatother
\vfill
\normalsize