...
https://www.ncbi.nlm.nih.gov/genome/browse/#!/eukaryotes/11236/
Fetch the phospholipase proteins:
Code Block |
---|
# Step 1: unpack the gzipped protein FASTA (gzip replaces the .gz with the plain .faa file).
gzip --decompress GCA_015679415.1_UCR_MalpAD072_1.0_protein.faa.gz
# Step 2: reformat the FASTA so each sequence sits on a single line.
# NOTE(review): the meaning of the trailing "0" argument is defined by extract_seqs.py, which is not shown here - confirm.
python2.7 /work/speight_team/projects/yeast_genomes/scripts/extract_seqs.py \
  GCA_015679415.1_UCR_MalpAD072_1.0_protein.faa 0 \
  > GCA_015679415.1_UCR_MalpAD072_1.0_protein.mod.faa
# Step 3: keep every line containing "Phospholipase" together with the line that follows it,
# then drop the "--" separator lines grep prints between non-adjacent matches.
grep --after-context=1 "Phospholipase" GCA_015679415.1_UCR_MalpAD072_1.0_protein.mod.faa \
  | sed -e '/^--$/d' \
  > Phospholipase_proteins.fasta |