Postagens

Mostrando postagens de outubro, 2015

Merge de reads x lncRNAs no R

system("pwd") HCLnc <-read.delim(file="/work/srsilva/AssemblyUvul.HCLnclist.out",stringsAsFactors=FALSE) HCLnc <-read.delim(file="/work/srsilva/Assembly/Uvul.HCLnclist.out",stringsAsFactors=FALSE) HCLnc <-read.delim(file="/work/srsilva/Assembly/HCLnc/Uvul.HCLnclist.out",stringsAsFactors=FALSE) colnames(HCLnc) <- c('IDreads') concatena <-merge(x=readsvsmontagem, y=HCLnc, by='IDreads' ) concatena dim(concatena) /U_vulgaris/Assemb/DBBwtUvulgaris/Uvul-counts.txt", stringsAsFactors=FALSE, header=FALSE) colnames(readsvsmontagem) <-c('IDreads','count') colnames(HCLnc) <- c('IDreads') concatena <-merge(x=readsvsmontagem, y=HCLnc, by='IDreads') dim(concatena) dim(HCLnc) dim(readsvsmontagem) sel <- c("isotig38248","isotig32047","isotig38212","isotig35263","isotig40992","isotig02091","isotig02090","isotig

Usando o merge no R

> matchesfolhas <-read.delim(file="folha-rRNA.sam.ids", header=FALSE, stringsAsFactors=FALSE)
> colnames(matchesfolhas) <- c('IDread','IDsilva')
> silvaclass <- read.delim(file="../../../tmp/SILVA_119.txt", header=FALSE, stringsAsFactors=FALSE)
> colnames(silvaclass) <- c('IDsilva','IDclass')
> res <- merge(x=matchesfolhas, y=silvaclass, by='IDsilva')

Para procurar por um vetor de strings: subset(res,IDclass %in% outralistaqualquer)

Extraindo lista de arquivos fasta

Extraindo lista de arquivos fasta: grep '>' Pvulgaris.Lnc.out-1438107679-HighConfidencelncRNA.fa | sed 's/>//' |