forked from JRaviLab/MolEvolvR
-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathcreateIPRScanDomainTable.Rd
More file actions
44 lines (40 loc) · 1.56 KB
/
createIPRScanDomainTable.Rd
File metadata and controls
44 lines (40 loc) · 1.56 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
% Generated by roxygen2: do not edit by hand
% Please edit documentation in R/fa2domain.R
\name{createIPRScanDomainTable}
\alias{createIPRScanDomainTable}
\title{For a given accession number, get the domain sequences using a interproscan
output table & the original FASTA file}
\usage{
createIPRScanDomainTable(
accnum,
fasta,
df_iprscan,
analysis = c("Pfam", "Gene3D")
)
}
\arguments{
\item{accnum}{\link[rlang:vector-construction]{rlang::chr} a \emph{single} accession number from the original fasta (fasta param)
which will be used to search for its sequence's domains (df_iprscan param)}
\item{fasta}{\link[Biostrings:XStringSet-class]{Biostrings::AAStringSet} original fasta file which was fed into interproscan}
\item{df_iprscan}{\link{tbl_df} the output TSV of interproscan, read as a tibble with
readIPRScanTSV()}
\item{analysis}{\link[rlang:vector-construction]{rlang::chr} the domain databases to extract sequences from}
}
\value{
\link{tbl_df} table with each domain sequence and a new identifier column
}
\description{
For a given accession number, get the domain sequences using a interproscan
output table & the original FASTA file
}
\examples{
\dontrun{
path_molevol_scripts <- file.path(Sys.getenv("DEV", unset = "/data/molevolvr_transfer/molevolvr_dev"), "molevol_scripts")
setwd(path_molevol_scripts)
source("R/fa2domain.R")
fasta <- Biostrings::readAAStringSet("./tests/example_protein.fa")
df_iprscan <- readIPRScanTSV("./tests/example_iprscan_valid.tsv")
accnum <- df_iprscan$AccNum[1]
df_iprscan_domains <- createIPRScanDomainTable(accnum, fasta, df_iprscan)
}
}