Skip to content
Snippets Groups Projects
Commit 8cf68c24 authored by Holger Brandl's avatar Holger Brandl
Browse files

cont. expression data prep

parent bbde64d6
No related branches found
No related tags found
No related merge requests found
......@@ -98,7 +98,7 @@ rownames2column <- function(df, colname){
df <- as.df(df)
df$tttt <- rownames(df);
rownames(df) <- NULL;
rename(df, c(tttt=colname))
plyr::rename(df, c(tttt=colname))
}
......
......@@ -181,3 +181,25 @@ BlastProgress(){
done
}
export -f BlastProgress
## FilterFastaByIDFile <id-file>
## Reads FASTA records from stdin and writes to stdout only those records whose
## id is listed in <id-file> (format: one id per line).
## Needs a python interpreter on the PATH that can import Bio.SeqIO.
FilterFastaByIDFile(){
    # Fail early with a readable message instead of a Python traceback.
    if [ ! -r "$1" ]; then
        echo "FilterFastaByIDFile: cannot read id file: '$1'" >&2
        return 1
    fi

    python -c '
from Bio import SeqIO
import sys

# http://stackoverflow.com/questions/3925614/how-do-you-read-a-file-into-a-list-in-python
# A set gives constant-time membership tests; a list is rescanned for every record.
with open(sys.argv[1]) as f:
    wanted_ids = set(f.read().splitlines())

for record in SeqIO.parse(sys.stdin, "fasta"):
    # recordID=record.description.split(" ")[1]
    # Parenthesised print emits the same bytes under Python 2 and Python 3.
    if record.id in wanted_ids:
        print(record.format("fasta"))
' "$1";
}
export -f FilterFastaByIDFile
0% Loading or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment