Compare commits

..

2 Commits

Author SHA1 Message Date
Samuel Ortion 61c504ec61 feat: Adding some text on duplication mechanisms 2024-03-26 15:16:00 +01:00
Samuel Ortion e16913e3d7 Migrating to org-mode 2024-03-21 19:36:09 +01:00
19 changed files with 740 additions and 29 deletions

2
.gitattributes vendored Normal file
View File

@ -0,0 +1,2 @@
main.pdf filter=lfs diff=lfs merge=lfs -text
*.pdf filter=lfs diff=lfs merge=lfs -text

View File

@ -1,3 +1,9 @@
# Run ./folder-structure.sh and report (without aborting) when it fails.
# Returns the raw status value from system(): 0 on success, non-zero otherwise.
sub createFolderStructure{
    # List form of system() runs bash directly instead of going through an
    # intermediate shell to parse a command string.
    my $status = system("bash", "./folder-structure.sh");
    # Best effort: a failure is reported but does not stop the rc file from
    # loading, matching the previous non-fatal behaviour.
    warn "folder-structure.sh failed (system() returned $status)\n" if $status != 0;
    return $status;
}
# Executed when this rc file is read.
createFolderStructure();
$hash_calc_ignore_pattern{aux} = $hash_calc_ignore_pattern{aux} =
'^\\\\gdef\\\\minted@oldcachelist\{,' '^\\\\gdef\\\\minted@oldcachelist\{,'
. '|^\s*default\.pygstyle,' . '|^\s*default\.pygstyle,'

View File

@ -1,6 +1,5 @@
OPTIONS=-shell-escape -file-line-error -synctex=1 OPTIONS=-shell-escape -file-line-error -synctex=1
SOURCE=main SOURCE=report
all: latexmk bib glossaries latexmk all: latexmk bib glossaries latexmk
build: build:

BIN
figures/lallemand2020-fig1_copy.pdf (Stored with Git LFS) Normal file

Binary file not shown.

View File

@ -0,0 +1,438 @@
<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!-- Created with Inkscape (http://www.inkscape.org/) -->
<svg
width="210mm"
height="297mm"
viewBox="0 0 210 297"
version="1.1"
id="svg1"
inkscape:version="1.3.2 (091e20ef0f, 2023-11-25)"
sodipodi:docname="lallemand2020-fig1_copy.svg"
inkscape:export-filename="lallemand2020-fig1_copy.pdf"
inkscape:export-xdpi="96"
inkscape:export-ydpi="96"
xmlns:inkscape="http://www.inkscape.org/namespaces/inkscape"
xmlns:sodipodi="http://sodipodi.sourceforge.net/DTD/sodipodi-0.dtd"
xmlns="http://www.w3.org/2000/svg"
xmlns:svg="http://www.w3.org/2000/svg">
<sodipodi:namedview
id="namedview1"
pagecolor="#ffffff"
bordercolor="#000000"
borderopacity="0.25"
inkscape:showpageshadow="2"
inkscape:pageopacity="0.0"
inkscape:pagecheckerboard="0"
inkscape:deskcolor="#d1d1d1"
inkscape:document-units="mm"
showgrid="true"
inkscape:zoom="1.0356019"
inkscape:cx="479.43132"
inkscape:cy="362.10825"
inkscape:window-width="1920"
inkscape:window-height="1008"
inkscape:window-x="0"
inkscape:window-y="0"
inkscape:window-maximized="1"
inkscape:current-layer="g40">
<inkscape:grid
id="grid2"
units="mm"
originx="0"
originy="0"
spacingx="0.99999998"
spacingy="1"
empcolor="#0099e5"
empopacity="0.30196078"
color="#0099e5"
opacity="0.14901961"
empspacing="5"
dotted="false"
gridanglex="30"
gridanglez="30"
visible="true" />
</sodipodi:namedview>
<defs
id="defs1">
<marker
style="overflow:visible"
id="ArrowTriangleStylized"
refX="0"
refY="0"
orient="auto-start-reverse"
inkscape:stockid="Stylized triangle arrow"
markerWidth="1"
markerHeight="1"
viewBox="0 0 1 1"
inkscape:isstock="true"
inkscape:collect="always"
preserveAspectRatio="xMidYMid">
<path
transform="scale(0.5)"
style="fill:context-stroke;fill-rule:evenodd;stroke:context-stroke;stroke-width:1pt"
d="m 6,0 c -3,1 -7,3 -9,5 0,0 0,-4 2,-5 -2,-1 -2,-5 -2,-5 2,2 6,4 9,5 z"
id="path4" />
</marker>
</defs>
<g
inkscape:label="Layer 1"
inkscape:groupmode="layer"
id="layer1">
<text
xml:space="preserve"
style="font-size:4.23333px;font-family:'Latin Modern Roman';-inkscape-font-specification:'Latin Modern Roman, Normal';fill:none;fill-opacity:0.913725;stroke:#cccccc;stroke-width:1"
x="21.964703"
y="25"
id="text1"><tspan
sodipodi:role="line"
id="tspan1"
style="fill:#000000;stroke:none;stroke-width:1"
x="21.964703"
y="25">A</tspan></text>
<g
id="g7"
transform="translate(8.6387193,3.9999999)"
style="stroke:#0000ff">
<circle
style="fill:none;fill-opacity:0.913725;stroke:#000000;stroke-width:1;stroke-dasharray:none"
id="path2"
cx="53.232861"
cy="35.984467"
r="14.015532"
transform="translate(-8.6387193,-3.9999999)" />
<g
id="g4"
style="stroke:#0000ff"
transform="translate(-11.149481,-3.9999999)">
<path
style="fill:none;fill-opacity:0.913725;stroke:#0000ff;stroke-width:1;stroke-dasharray:none"
d="m 46.626465,29.999998 c 0.230253,1.609669 0.884298,5.000001 0.884298,5.000001 0,0 -0.617872,3.263792 -0.884298,5"
id="path3"
sodipodi:nodetypes="ccc" />
<path
style="fill:none;fill-opacity:0.913725;stroke:#0000ff;stroke-width:1;stroke-dasharray:none"
d="m 49.000001,29.999999 -0.638719,5 L 49.000001,40"
id="path3-1"
sodipodi:nodetypes="ccc" />
</g>
<g
id="g4-6"
style="stroke:#0000ff"
transform="translate(-6.7900835,-4.0025177)">
<path
style="fill:none;fill-opacity:0.913725;stroke:#0000ff;stroke-width:1;stroke-dasharray:none"
d="m 46.626465,29.999998 c 0.230253,1.609669 0.884298,5.000001 0.884298,5.000001 0,0 -0.617872,3.263792 -0.884298,5"
id="path3-5"
sodipodi:nodetypes="ccc" />
<path
style="fill:none;fill-opacity:0.913725;stroke:#0000ff;stroke-width:1;stroke-dasharray:none"
d="m 49.000001,29.999999 -0.638719,5 L 49.000001,40"
id="path3-1-6"
sodipodi:nodetypes="ccc" />
</g>
<g
id="g5"
style="stroke:#ff6600">
<path
style="fill:none;fill-opacity:0.913725;stroke:#ff6600;stroke-width:1;stroke-dasharray:none"
d="m 47.169376,32.256753 c 0.230253,1.609669 0.341387,2.743246 0.341387,2.743246 0,0 -0.266577,1.826675 -0.533003,3.562883"
id="path3-5-3"
sodipodi:nodetypes="ccc" />
<path
style="fill:none;fill-opacity:0.913725;stroke:#ff6600;stroke-width:1;stroke-dasharray:none"
d="m 48.936129,32.363258 -0.574847,2.636741 0.606783,3.638722"
id="path3-1-6-8"
sodipodi:nodetypes="ccc" />
</g>
<g
id="g6"
transform="translate(3.6966086,0.18063894)"
style="stroke:#ff6600">
<path
style="fill:none;fill-opacity:0.913725;stroke:#ff6600;stroke-width:1;stroke-dasharray:none"
d="m 47.169376,32.256753 c 0.230253,1.609669 0.341387,2.743246 0.341387,2.743246 0,0 -0.266577,1.826675 -0.533003,3.562883"
id="path5"
sodipodi:nodetypes="ccc" />
<path
style="fill:none;fill-opacity:0.913725;stroke:#ff6600;stroke-width:1;stroke-dasharray:none"
d="m 48.936129,32.363258 -0.574847,2.636741 0.606783,3.638722"
id="path6"
sodipodi:nodetypes="ccc" />
</g>
</g>
<g
id="g15"
transform="translate(80.405862,4.0000004)"
style="stroke:#0000ff">
<g
id="g23"
transform="translate(17.616381,0.32044963)">
<circle
style="fill:none;fill-opacity:0.913725;stroke:#000000;stroke-width:1;stroke-dasharray:none"
id="circle7"
cx="53.232861"
cy="35.984467"
r="14.015532"
transform="translate(-8.6387193,-3.9999999)" />
<g
id="g8"
style="stroke:#0000ff"
transform="translate(-9.5619803,-8.2333335)">
<path
style="fill:none;fill-opacity:0.913725;stroke:#0000ff;stroke-width:1;stroke-dasharray:none"
d="m 46.626465,29.999998 c 0.230253,1.609669 0.884298,5.000001 0.884298,5.000001 0,0 -0.617872,3.263792 -0.884298,5"
id="path7"
sodipodi:nodetypes="ccc" />
<path
style="fill:none;fill-opacity:0.913725;stroke:#0000ff;stroke-width:1;stroke-dasharray:none"
d="m 49.000001,29.999999 -0.638719,5 L 49.000001,40"
id="path8"
sodipodi:nodetypes="ccc" />
</g>
<g
id="g10"
style="stroke:#0000ff"
transform="translate(-5.2025834,-8.2358513)">
<path
style="fill:none;fill-opacity:0.913725;stroke:#0000ff;stroke-width:1;stroke-dasharray:none"
d="m 46.626465,29.999998 c 0.230253,1.609669 0.884298,5.000001 0.884298,5.000001 0,0 -0.617872,3.263792 -0.884298,5"
id="path9"
sodipodi:nodetypes="ccc" />
<path
style="fill:none;fill-opacity:0.913725;stroke:#0000ff;stroke-width:1;stroke-dasharray:none"
d="m 49.000001,29.999999 -0.638719,5 L 49.000001,40"
id="path10"
sodipodi:nodetypes="ccc" />
</g>
<g
id="g12"
style="stroke:#ff9f00;stroke-opacity:1"
transform="translate(0,2.1166667)">
<path
style="fill:none;fill-opacity:0.913725;stroke:#ff9f00;stroke-width:1;stroke-dasharray:none;stroke-opacity:1"
d="m 47.169376,32.256753 c 0.230253,1.609669 0.341387,2.743246 0.341387,2.743246 0,0 -0.266577,1.826675 -0.533003,3.562883"
id="path11"
sodipodi:nodetypes="ccc" />
<path
style="fill:none;fill-opacity:0.913725;stroke:#ff9f00;stroke-width:1;stroke-dasharray:none;stroke-opacity:1"
d="m 48.936129,32.363258 -0.574847,2.636741 0.606783,3.638722"
id="path12"
sodipodi:nodetypes="ccc" />
</g>
<g
id="g14"
transform="translate(3.6966086,2.2973057)"
style="stroke:#ff9f00;stroke-opacity:1">
<path
style="fill:none;fill-opacity:0.913725;stroke:#ff9f00;stroke-width:1;stroke-dasharray:none;stroke-opacity:1"
d="m 47.169376,32.256753 c 0.230253,1.609669 0.341387,2.743246 0.341387,2.743246 0,0 -0.266577,1.826675 -0.533003,3.562883"
id="path13"
sodipodi:nodetypes="ccc" />
<path
style="fill:none;fill-opacity:0.913725;stroke:#ff9f00;stroke-width:1;stroke-dasharray:none;stroke-opacity:1"
d="m 48.936129,32.363258 -0.574847,2.636741 0.606783,3.638722"
id="path14"
sodipodi:nodetypes="ccc" />
</g>
<g
id="g16"
style="stroke:#008eff;stroke-opacity:1"
transform="translate(-9.5619803,2.879167)">
<path
style="fill:none;fill-opacity:0.913725;stroke:#008eff;stroke-width:1;stroke-dasharray:none;stroke-opacity:1"
d="m 46.626465,29.999998 c 0.230253,1.609669 0.884298,5.000001 0.884298,5.000001 0,0 -0.617872,3.263792 -0.884298,5"
id="path15"
sodipodi:nodetypes="ccc" />
<path
style="fill:none;fill-opacity:0.913725;stroke:#008eff;stroke-width:1;stroke-dasharray:none;stroke-opacity:1"
d="m 49.000001,29.999999 -0.638719,5 L 49.000001,40"
id="path16"
sodipodi:nodetypes="ccc" />
</g>
<g
id="g18"
style="stroke:#008eff;stroke-opacity:1"
transform="translate(-5.2025834,2.8766492)">
<path
style="fill:none;fill-opacity:0.913725;stroke:#008eff;stroke-width:1;stroke-dasharray:none;stroke-opacity:1"
d="m 46.626465,29.999998 c 0.230253,1.609669 0.884298,5.000001 0.884298,5.000001 0,0 -0.617872,3.263792 -0.884298,5"
id="path17"
sodipodi:nodetypes="ccc" />
<path
style="fill:none;fill-opacity:0.913725;stroke:#008eff;stroke-width:1;stroke-dasharray:none;stroke-opacity:1"
d="m 49.000001,29.999999 -0.638719,5 L 49.000001,40"
id="path18"
sodipodi:nodetypes="ccc" />
</g>
<g
id="g20"
style="stroke:#ff6600"
transform="translate(0,-8.4666671)">
<path
style="fill:none;fill-opacity:0.913725;stroke:#ff6600;stroke-width:1;stroke-dasharray:none"
d="m 47.169376,32.256753 c 0.230253,1.609669 0.341387,2.743246 0.341387,2.743246 0,0 -0.266577,1.826675 -0.533003,3.562883"
id="path19"
sodipodi:nodetypes="ccc" />
<path
style="fill:none;fill-opacity:0.913725;stroke:#ff6600;stroke-width:1;stroke-dasharray:none"
d="m 48.936129,32.363258 -0.574847,2.636741 0.606783,3.638722"
id="path20"
sodipodi:nodetypes="ccc" />
</g>
<g
id="g22"
transform="translate(3.6966086,-8.2860282)"
style="stroke:#ff6600">
<path
style="fill:none;fill-opacity:0.913725;stroke:#ff6600;stroke-width:1;stroke-dasharray:none"
d="m 47.169376,32.256753 c 0.230253,1.609669 0.341387,2.743246 0.341387,2.743246 0,0 -0.266577,1.826675 -0.533003,3.562883"
id="path21"
sodipodi:nodetypes="ccc" />
<path
style="fill:none;fill-opacity:0.913725;stroke:#ff6600;stroke-width:1;stroke-dasharray:none"
d="m 48.936129,32.363258 -0.574847,2.636741 0.606783,3.638722"
id="path22"
sodipodi:nodetypes="ccc" />
</g>
</g>
<path
style="fill:none;fill-opacity:0.913725;stroke:#000000;stroke-width:1;stroke-dasharray:none;stroke-opacity:1;marker-end:url(#ArrowTriangleStylized)"
d="m 4.5617219,30.997399 25.0324191,0.0026"
id="path23" />
<text
xml:space="preserve"
style="font-size:4.23333px;font-family:'Latin Modern Roman';-inkscape-font-specification:'Latin Modern Roman, Normal';fill:none;fill-opacity:0.913725;stroke:#000000;stroke-width:1;stroke-dasharray:none;stroke-opacity:1"
x="-5.320653"
y="25.072666"
id="text23"><tspan
sodipodi:role="line"
id="tspan23"
style="fill:#000000;stroke:none;stroke-width:1"
x="-5.320653"
y="25.072666">whole genome duplication</tspan></text>
<path
style="fill:none;fill-opacity:0.913725;stroke:#000000;stroke-width:1;stroke-dasharray:none;stroke-opacity:1;marker-end:url(#ArrowTriangleStylized)"
d="m 4.8701727,100.96179 25.0324193,0.003"
id="path24" />
</g>
<text
xml:space="preserve"
style="font-size:4.23333px;font-family:'Latin Modern Roman';-inkscape-font-specification:'Latin Modern Roman, Normal';fill:#000000;fill-opacity:0.913725;stroke-width:1"
x="20"
y="65"
id="text2"><tspan
sodipodi:role="line"
id="tspan2"
style="stroke-width:1"
x="20"
y="65">B</tspan></text>
<text
xml:space="preserve"
style="font-size:4.23333px;font-family:'Latin Modern Roman';-inkscape-font-specification:'Latin Modern Roman, Normal';fill:#000000;fill-opacity:0.913725;stroke-width:1"
x="80.6063"
y="99.027908"
id="text3"><tspan
sodipodi:role="line"
id="tspan3"
style="stroke-width:1"
x="80.6063"
y="99.027908">unequal crossing-over</tspan></text>
<path
style="fill:none;fill-opacity:0.913725;stroke:#ffaaaa;stroke-width:1"
d="m 44.960266,113.25722 0.03973,8.74277"
id="path36" />
<path
style="fill:none;fill-opacity:0.913725;stroke:#0000ff;stroke-width:1"
d="m 44.868446,93.051087 0.09182,20.206133"
id="path25" />
<path
style="fill:none;fill-opacity:0.913725;stroke:#ffaaaa;stroke-width:1"
d="m 54.866979,113.92631 0.01262,8.07595"
id="path32"
sodipodi:nodetypes="cc" />
<path
style="fill:none;fill-opacity:0.913725;stroke:#0000ff;stroke-width:1"
d="m 50.000001,92.999997 v 4 c 1e-6,9.000003 5.188809,4.505713 4.866978,16.926313"
id="path26"
sodipodi:nodetypes="csc" />
<path
style="fill:none;fill-opacity:0.913725;stroke:#ff0000;stroke-width:1"
d="m 51.002359,106.37341 c -0.500431,1.23589 -0.794678,3.15897 -0.682998,7.26333"
id="path33" />
<path
style="fill:none;fill-opacity:0.913725;stroke:#0000ff;stroke-width:1"
d="m 54.922619,84.055247 -0.273915,12.94475 c -1.07215,7.153293 -2.715748,7.075173 -3.646345,9.373413"
id="path27" />
<path
style="fill:none;fill-opacity:0.913725;stroke:#ff0000;stroke-width:1"
d="m 60.053664,104.08938 -0.10732,7.82124"
id="path29"
sodipodi:nodetypes="cc" />
<path
style="fill:none;fill-opacity:0.913725;stroke:#0000ff;stroke-width:1"
d="m 60.214294,84.055247 -0.16063,20.034133"
id="path28"
sodipodi:nodetypes="cc" />
<g
id="g40"
transform="translate(-15.287297,-0.01996951)">
<path
style="fill:none;fill-opacity:0.913725;stroke:#ffaaaa;stroke-width:1"
d="m 145.33224,111.9049 0.0417,9.17903"
id="path37" />
<path
style="fill:none;fill-opacity:0.913725;stroke:#0000ff;stroke-width:1"
d="m 145.2424,92.135035 0.0898,19.769865"
id="path38" />
<path
style="fill:none;fill-opacity:0.913725;stroke:#ffaaaa;stroke-width:1;stroke-dasharray:1, 1;stroke-dashoffset:0"
d="m 150.00669,111.9049 0.0417,9.17903"
id="path46" />
</g>
<g
id="g41"
transform="translate(-15.297386,-0.0183055)">
<path
style="fill:none;fill-opacity:0.913725;stroke:#ff0000;stroke-width:1"
d="m 150.00494,101.6855 0.002,10.2194"
id="path39"
sodipodi:nodetypes="cc" />
<path
style="fill:none;fill-opacity:0.913725;stroke:#0000ff;stroke-width:1"
d="m 150.00493,92.135035 1e-5,9.550465"
id="path40"
sodipodi:nodetypes="cc" />
</g>
<g
id="g42"
transform="translate(8.7127035,-0.01997038)">
<path
style="fill:#ff0000;fill-opacity:0.913725;stroke:#ffaaaa;stroke-width:1"
d="m 145.33224,123.01747 0.0417,9.17903"
id="path41" />
<path
style="fill:none;fill-opacity:0.913725;stroke:#0000ff;stroke-width:1"
d="m 145.2424,92.135035 0.0898,30.882435"
id="path42"
sodipodi:nodetypes="cc" />
<path
style="fill:none;fill-opacity:0.913725;stroke:#ffaaaa;stroke-width:1;stroke-dasharray:1,1;stroke-dashoffset:0"
d="m 150.09477,123.01747 0.0417,9.17903"
id="path45" />
</g>
<g
id="g44"
transform="translate(8.7127035,-0.01997038)">
<path
style="fill:none;fill-opacity:0.913725;stroke:#ff0000;stroke-width:1"
d="m 150.09129,113.25497 0.0452,9.94564"
id="path43" />
<path
style="fill:none;fill-opacity:0.913725;stroke:#0000ff;stroke-width:1"
d="m 150.00493,92.135035 0.0864,21.119935"
id="path44"
sodipodi:nodetypes="cc" />
</g>
</g>
</svg>

After

Width:  |  Height:  |  Size: 18 KiB

8
folder-structure.sh Normal file
View File

@ -0,0 +1,8 @@
#!/bin/sh
# Mirror the directory tree found under ./content into ./build, so that
# build/content/... contains the same (empty) sub-directories.
#
# Must be run from the directory that contains ./content.

# Stop early if the build directory cannot be created; otherwise the
# directories below would end up in the wrong place.
mkdir -p build || exit 1

# Create each directory directly from find: no temporary list file, no
# change of working directory, and names containing spaces or quotes are
# passed through intact (xargs would split them).
find ./content -type d -exec sh -c '
    for dir do
        mkdir -p "build/$dir"
    done
' sh {} +

View File

BIN
main.pdf

Binary file not shown.

Binary file not shown.

Binary file not shown.

Binary file not shown.

92
report.org Normal file
View File

@ -0,0 +1,92 @@
#+title: Further development on Finder, a pipeline to identify Tandem Arrayed Genes
#+author: Samuel Ortion
#+date: 2023-2024
#+LATEX_CLASS: scientific-project
#+LATEX_HEADER: \usepackage{sty/lamme2024}
#+latex_header_extra: \newglossaryentry{LaMME}{name={LaMME},description={Laboratoire de Mathématiques et Modélisation d'Évry}}
#+bibliography: ../references.bib
#+exclude_tags: noexport
#+options: H:7
#+options: toc:nil
# ref. https://write.as/dani/writing-a-phd-thesis-with-org-mode
#+name: acronyms
| key | abbreviation | full form |
|-----+--------------+---------------------|
| TAG | TAG | Tandem Arrayed Gene |
| FTAG | FTAG | Families and Tandem Arrayed Gene |
#+begin_export latex
\hypersetup{
pdfauthor={Samuel Ortion},
pdftitle={},
pdfkeywords={duplicate genes, workflow management systems, pipeline},
}
\pagenumbering{roman}
#+end_export
#+begin_abstract
Duplicate genes are an important component of genomes. They play a particular role in genome evolution, allowing species to explore new gene functions by offering a pool of usable genes to build on.
TODO:
#+end_abstract
#+begin_center
*keywords*: duplicate genes, tandem arrayed genes, pipeline
#+end_center
#+begin_export latex
\tableofcontents
#+end_export
[[printglossaries:]]
#+begin_export latex
\pagenumbering{arabic}
#+end_export
* Context
** What are duplicate genes?
Duplicate genes are genes that experienced a duplication event during species evolution.
These are homologous genes.
*** Duplication mechanisms
#+name: fig:gene-duplication-mechanisms
#+CAPTION: Mechanisms leading to gene duplication
[[./figures/lallemand2020-fig1_copy.pdf]]
Several mechanisms may lead to gene duplication. We review them in this section.
**** Segment duplication
**** Retroduplication
Transposable elements account for a significant share of gene duplications [citation needed].
Retrotransposons, or RNA transposons, are one type of transposable element. Some retrotransposons are similar to retroviruses.
Retrotransposons may be duplicated in the genome through a mechanism known as "copy-and-paste".
These transposons typically contain a reverse transcriptase gene. The protein encoded by this gene can reverse-transcribe the RNA transcript of the transposon sequence, producing a DNA sequence which can then be inserted elsewhere in the genome.
During this process, the RNA transcript may include a nearby gene sequence, which can thus be copied and pasted along with the retrotransposon.
**** Transduplication
DNA transposons are another type of transposable element whose transposition mechanism can also lead to gene duplication.
This type of transposable element moves in the genome through a mechanism known as "cut-and-paste".
A typical DNA transposon contains a transposase gene. The protein encoded by this gene recognizes two sites flanking the donor transposon sequence in the chromosome and cleaves the DNA at these sites. The transposase can then insert the transposon at a new location in the genome.
As with retrotransposons, if a gene is present between the two cleavage sites of the donor transposon, it may move with the transposed sequence.
**** Tandem Duplication
**** Polyploidisation
***** Allopolyploidisation
***** Autopolyploidisation
***** Mechanisms
****** Polyspermy
****** Non-reduced gametes
**** Unequal crossing-over
A crossing-over may occur during cell division: a chromosome fragment is exchanged between two chromatids of a pair of chromosomes. If the two chromatids are cleaved at different positions, the exchanged fragments may have different lengths. When the missing fragment is repaired, the resulting chromosome will incorporate a duplicated region, potentially duplicating the genes present in this region, as represented in figure [[fig:gene-duplication-mechanisms]] B.
# TODO: check that this is really the B subfigure
*** Role in genome evolution
** Identification of duplicate genes
***
*** Finder
* Objectives
** Amend the existing Galaxy pipeline
Last year, an M1 student, Seanna Charles, worked on the Galaxy version of the [[gls:FTAG][FTAG]] Finder pipeline [cite:@charlesFinalisationPipelineFTAG2023].
During my internship, I will continue this work.
** Porting Finder pipeline on a workflow manager
#+begin_export latex
\printbibliography
#+end_export

BIN
report.pdf (Stored with Git LFS) Normal file

Binary file not shown.

111
report.tex Normal file
View File

@ -0,0 +1,111 @@
% Created 2024-03-26 Tue 15:13
% Intended LaTeX compiler: lualatex
\documentclass{scrbook}
\usepackage{sty/lamme2024}
\newacronym{TAG}{TAG}{Tandem Arrayed Gene}
\newacronym{FTAG}{FTAG}{Families and Tandem Arrayed Gene}
\newglossaryentry{LaMME}{name={LaMME},description={Laboratoire de Mathématiques et Modélisation d'Évry}}
\makeindex
\makeglossaries
\usepackage{minted}
\author{Samuel Ortion}
\date{2023-2024}
\title{Further development on Finder, a pipeline to identify Tandem Arrayed Genes}
\hypersetup{
pdfauthor={Samuel Ortion},
pdftitle={Further development on Finder, a pipeline to identify Tandem Arrayed Genes},
pdfkeywords={},
pdfsubject={},
pdfcreator={Emacs 29.2 (Org mode 9.7)},
pdflang={English}}
\usepackage{biblatex}
\addbibresource{../references.bib}
\begin{document}
\maketitle
\hypersetup{
pdfauthor={Samuel Ortion},
pdftitle={},
pdfkeywords={duplicate genes, workflow management systems, pipeline},
}
\pagenumbering{roman}
\begin{abstract}
Duplicate genes are an important component of genomes. They play a particular role in genome evolution, allowing species to explore new gene functions by offering a pool of usable genes to build on.
TODO:
\end{abstract}
\begin{center}
\textbf{keywords}: duplicate genes, tandem arrayed genes, pipeline
\end{center}
\tableofcontents
\printglossaries
\pagenumbering{arabic}
\part{Context}
\label{sec:org8d0fa24}
\chapter{What are duplicate genes?}
\label{sec:orgee68751}
Duplicate genes are genes that experienced a duplication event during species evolution.
These are homologous genes.
\section{Duplication mechanisms}
\label{sec:orgcf44cad}
\begin{figure}[htbp]
\centering
\includegraphics[width=.9\linewidth]{./figures/lallemand2020-fig1_copy.pdf}
\caption{\label{fig:gene-duplication-mechanisms}Mechanisms leading to gene duplication}
\end{figure}
Several mechanisms may lead to gene duplication. We review them in this section.
\subsection{Segment duplication}
\label{sec:org922a1dd}
\subsection{Retroduplication}
\label{sec:orgd8f7e18}
Transposable elements account for a significant share of gene duplications [citation needed].
Retrotransposons, or RNA transposons, are one type of transposable element. Some retrotransposons are similar to retroviruses.
Retrotransposons may be duplicated in the genome through a mechanism known as ``copy-and-paste''.
These transposons typically contain a reverse transcriptase gene. The protein encoded by this gene can reverse-transcribe the RNA transcript of the transposon sequence, producing a DNA sequence which can then be inserted elsewhere in the genome.
During this process, the RNA transcript may include a nearby gene sequence, which can thus be copied and pasted along with the retrotransposon.
\subsection{Transduplication}
\label{sec:org74a527a}
DNA transposons are another type of transposable element whose transposition mechanism can also lead to gene duplication.
This type of transposable element moves in the genome through a mechanism known as ``cut-and-paste''.
A typical DNA transposon contains a transposase gene. The protein encoded by this gene recognizes two sites flanking the donor transposon sequence in the chromosome and cleaves the DNA at these sites. The transposase can then insert the transposon at a new location in the genome.
As with retrotransposons, if a gene is present between the two cleavage sites of the donor transposon, it may move with the transposed sequence.
\subsection{Tandem Duplication}
\label{sec:org1185c12}
\subsection{Polyploidisation}
\label{sec:org349eaa4}
\subsubsection{Allopolyploidisation}
\label{sec:org323512f}
\subsubsection{Autopolyploidisation}
\label{sec:orgba5b73e}
\subsubsection{Mechanisms}
\label{sec:orga1009de}
\paragraph{Polyspermy}
\label{sec:orgee32a5c}
\paragraph{Non-reduced gametes}
\label{sec:org3297de6}
\subsection{Unequal crossing-over}
\label{sec:org31e5f76}
A crossing-over may occur during cell division: a chromosome fragment is exchanged between two chromatids of a pair of chromosomes. If the two chromatids are cleaved at different positions, the exchanged fragments may have different lengths. When the missing fragment is repaired, the resulting chromosome will incorporate a duplicated region, potentially duplicating the genes present in this region, as represented in figure \ref{fig:gene-duplication-mechanisms} B.
% TODO: check that this is really the B subfigure
\section{Role in genome evolution}
\label{sec:orga7bdfd9}
\chapter{Identification of duplicate genes}
\label{sec:org3aec87b}
\textbf{*}
\section{Finder}
\label{sec:org9b93040}
\part{Objectives}
\label{sec:org1b30340}
\chapter{Amend the existing Galaxy pipeline}
\label{sec:orgf108b0f}
Last year, an M1 student, Seanna Charles, worked on the Galaxy version of the \gls{FTAG} Finder pipeline \autocite{charlesFinalisationPipelineFTAG2023}.
During my internship, I will continue this work.
\chapter{Porting Finder pipeline on a workflow manager}
\label{sec:orgd5c8063}
\printbibliography
\end{document}

View File

@ -1,31 +1,47 @@
% https://www.developpez.net/forums/d910711/autres-langages/autres-langages/latex/mise-forme/texte-recto-figures-verso/ % https://www.developpez.net/forums/d910711/autres-langages/autres-langages/latex/mise-forme/texte-recto-figures-verso/
% Solution by Martigan on Developpez.net % Solution by Martigan on Developpez.net
\iffalse
\RequirePackage{afterpage} \RequirePackage{afterpage}
\RequirePackage{caption} \RequirePackage{caption}
\newcommand\@addfig{\relax} \newcommand\@addfig{\relax}
\newcommand\addfig[1]{\global\long\def\@addfig{#1}} \newcommand\addfig[1]{\global\long\def\@addfig{#1}}
\newcommand\@putfig{\@addfig\addfig{\relax}} \newcommand\@putfig{\@addfig\addfig{\relax}}
\newcommand\blankpage{% \newcommand\flblankpage{%
\null \null
\vfill \vfill
\begin{figure}[H]
\captionsetup{type=figure} % Warning: this could be faulty if tables are required \captionsetup{type=figure} % Warning: this could be faulty if tables are required
\@putfig% \@putfig%
\end{figure}
\vfill \vfill
\thispagestyle{empty}% \thispagestyle{empty}%
\clearpage% \clearpage%
\addtocounter{page}{-1} %\addtocounter{page}{-1}
\afterpage{\blankpage} \afterpage{\flblankpage}
} }
\iffalse \iffalse
% Example % Example
\addfig{%
% Add this at the beginning of the document:
\afterpage{\flblankpage}
\addfig{%
\centering \centering
\includegraphics[scale=1]{Image1} \includegraphics[scale=1]{Image1}
\caption{Test} \caption{Test}
\label{Ima1} \label{Ima1}
} }
\fi \fi
\fi
% Redefinition of \@floatplacement, which globally resets the float-placement
% parameters \@topnum, \@toproom, \@botnum, \@botroom and \@colnum and sets
% \@fpmin from the corresponding counters/fractions and \@colht.
% The line marked with %<<<<<<< makes \@colnum depend on page parity:
% when \c@page is odd it is set to \c@totalnumber, otherwise to \z@ (zero).
% NOTE(review): presumably this is meant to forbid floats on every other page
% so that text and figures alternate -- confirm against the LaTeX kernel
% definition of \@floatplacement and the value of \c@page at the time it runs.
\def\@floatplacement{\global\@topnum\c@topnumber
\global\@toproom \topfraction\@colht
\global\@botnum \c@bottomnumber
\global\@botroom \bottomfraction\@colht
\global\@colnum \ifodd\c@page\c@totalnumber\else\z@\fi%<<<<<<<
\@fpmin \floatpagefraction\@colht}

View File

@ -1,23 +1,10 @@
\usepackage{graphicx} % Font
\usepackage{tikz}
\usepackage{xcolor}
\usepackage{hyperref}
\usepackage{fontspec} \usepackage{fontspec}
\setmainfont{TeX Gyre Termes} % Times New Roman alternative \setmainfont{TeX Gyre Termes} % Times New Roman alternative
\usepackage{setspace} \usepackage{setspace}
\onehalfspacing % 1.5 interline spacing \onehalfspacing % 1.5 interline spacing
\defaultfontfeatures[\rmfamily,\sffamily]{Ligatures=TeX} \defaultfontfeatures[\rmfamily,\sffamily]{Ligatures=TeX}
\addtokomafont{disposition}{\rmfamily}
% Force text on right side, float on left side
\usepackage{sty/floatlefttextright}
% Font
\RequirePackage{polyglossia}
\setmainlanguage{english}
%\setotherlanguage{french}
% Float % Float
@ -26,13 +13,13 @@
\RequirePackage{caption} \RequirePackage{caption}
\RequirePackage{subcaption} \RequirePackage{subcaption}
\RequirePackage{xcolor} \RequirePackage{xcolor}
\RequirePackage{csquotes}
\RequirePackage[english]{babel}
% Math % Math
\RequirePackage{amsmath} \RequirePackage{amsmath}
\RequirePackage{amsthm} \RequirePackage{amsthm}
\RequirePackage{amssymb} \RequirePackage{amssymb}
\usepackage{enumitem} \usepackage{enumitem}
\usepackage{lipsum} \usepackage{lipsum}
@ -45,8 +32,8 @@
citestyle=authoryear-comp, citestyle=authoryear-comp,
natbib=true natbib=true
]{biblatex} ]{biblatex}
\RequirePackage{doi} %\RequirePackage{doi}
\RequirePackage{xurl} %\RequirePackage{xurl}
\RequirePackage{orcidlink} \RequirePackage{orcidlink}
@ -68,3 +55,26 @@
stylemods=longbooktabs, % do the adjustments for the longbooktabs styles, stylemods=longbooktabs, % do the adjustments for the longbooktabs styles,
automake automake
]{glossaries-extra} ]{glossaries-extra}
\usepackage{hyperref}
% Force text on right side, float on left side
% \usepackage{sty/floatlefttextright}
\makeglossaries
\makeindex
\renewcommand\maketitle{\include{titlepage}}
% Abstract
% \abstractname is only defined here if the class has not already done so.
\providecommand{\abstractname}{Abstract} % not in scrbook class
% abstract environment: a rule, a bold "Abstract: " label, the body in small
% italics, then a closing rule and 0.6cm of vertical space.
% The environment takes no argument. It used to declare one, so that
%   \begin{abstract} Some text ... \end{abstract}
% silently consumed the first token of the body as #1 (which breaks as soon
% as the abstract starts with a macro). A body wrapped in braces, as in
% \begin{abstract}{Some text}, is still typeset normally.
\newenvironment{abstract}{%
\hrule
\small\textbf{\abstractname: }
\itshape % body text in italics
}{%
\newline\hrule
\vspace{0.6cm}
}

BIN
sty/test_figurelefttextright.pdf (Stored with Git LFS) Normal file

Binary file not shown.

View File

@ -0,0 +1,19 @@
% Manual test document for the floatlefttextright package: long filler text
% plus one figure registered through \addfig.
% NOTE(review): the package currently wraps the definitions of \addfig and
% \flblankpage in \iffalse ... \fi; they must be re-enabled there before this
% document can compile.
\documentclass{book}
\usepackage{floatlefttextright}
\usepackage{lipsum}
\usepackage{graphicx}
\begin{document}
% The package macro is named \flblankpage (formerly \blankpage).
\afterpage{\flblankpage}
% Paragraph ranges are given to \lipsum in brackets; \lipsum{100} would print
% the default paragraphs followed by the literal text "100".
\lipsum[1-100]
\addfig{
\includegraphics[width=\textwidth]{example-image-a}
\caption{Test figure}
\label{fig:Test figure}
}
\end{document}

View File

@ -11,15 +11,16 @@
\Large 2023--2024 \Large 2023--2024
\hfill \vfill
\Huge Samuel ORTION \orcidlink{0009-0001-0971-497X} \Large Samuel ORTION \orcidlink{0009-0001-0971-497X}
\vfill \vfill
\Huge \LARGE
\makeatletter
Development of a Nextflow\footnote{We still need to decide which workflow manager to choose: Nextflow or Snakemake} pipeline for FTAG Finder, a duplicate gene detection tool, and improvement of the existing Galaxy implementation \@title
\makeatother
\vfill \vfill
\normalsize \normalsize