2024-10-28 10:46:05 +01:00
|
|
|
#!/usr/bin/env -S awk -f
|
|
|
|
# Convert mcl output (each input line is one family) into TSV output
# with two columns: gene id, family identifier
|
|
|
|
|
|
|
|
# Runs once before any input is read: configure the separators and
# reset the family counter that the main rule increments per record.
BEGIN {
    # A single-space FS is awk's default splitting mode: fields are
    # separated by runs of blanks, and leading/trailing blanks are ignored.
    FS = " "

    # `print a, b` joins its arguments with OFS, so output is tab-separated.
    OFS = "\t"

    # No record has been seen yet; the first record becomes family 1.
    family_identifier = 0
}
|
|
|
|
|
|
|
|
# Runs for every input record: the record gets the next family number,
# and each of its fields is printed on its own line followed by that
# number (the two values are joined by OFS).
{
    family_identifier += 1

    # Walk the fields left to right; a record with no fields prints
    # nothing but still consumes a family number.
    col = 0
    while (++col <= NF) {
        print $col, family_identifier
    }
}
|