Versions Compared

Key

  • This line was added.
  • This line was removed.
  • Formatting was changed.
Comment: yeast_rna to yeast_rnaseq and sacCer_64 to sacCer3.64

...

Code Block
languagebash
titleLook at GFF annotation entries with less
mkdir -p $SCRATCH/core_ngs/bedtools
cd $SCRATCH/core_ngs/bedtools 
cp $CORENGS/yeast_rnarnaseq/sacCer_sacCer3.R64-1-1_20110208.gff . 
cp $CORENGS/yeast_rna/yeast_mrna.sort.filt.bam* .

# Use the less pager to look at multiple lines
less sacCer_sacCer3.R64-1-1_20110208.gff

# Look at just the most-important Tab-separated columns
cat sacCer_sacCer3.R64-1-1_20110208.gff | grep -v '#' | cut -f 1,3-5 | head -20

# Include the ugly 9th column where attributes are stored
cat sacCer_sacCer3.R64-1-1_20110208.gff | grep -v '#' | cut -f 1,3,9 | head

...

Expand
titleSetup (if needed)


Code Block
languagebash
mkdir -p $SCRATCH/core_ngs/bedtools
cd $SCRATCH/core_ngs/bedtools
cp $CORENGS/yeast_rnarnaseq/sacCer_sacCer3.R64-1-1_20110208.gff .



Code Block
languagebash
titleCreate a histogram of all the feature types in a GFF
cd $SCRATCH/core_ngs/bedtools
cat sacCer_sacCer3.R64-1-1_20110208.gff | grep -v '^#' | cut -f 3 | \
  sort | uniq -c | sort -k1,1nr | more

...

Code Block
titleFilter GFF gene feature with awk
cat sacCer_sacCer3.R64-1-1_20110208.gff | grep -v '#' | \
  awk 'BEGIN{FS=OFS="\t"}{ if($3=="gene"){print} }' \
  > sc_genes.gff
wc -l sc_genes.gff

...