forked from satijalab/seurat
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathFindVariableFeatures.Rd
132 lines (116 loc) · 4.44 KB
/
FindVariableFeatures.Rd
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
% Generated by roxygen2: do not edit by hand
% Please edit documentation in R/generics.R, R/preprocessing.R
\name{FindVariableFeatures}
\alias{FindVariableFeatures}
\alias{FindVariableGenes}
\alias{FindVariableFeatures.default}
\alias{FindVariableFeatures.Assay}
\alias{FindVariableFeatures.Seurat}
\title{Find variable features}
\usage{
FindVariableFeatures(object, ...)
\method{FindVariableFeatures}{default}(
object,
selection.method = "vst",
loess.span = 0.3,
clip.max = "auto",
mean.function = FastExpMean,
dispersion.function = FastLogVMR,
num.bin = 20,
binning.method = "equal_width",
verbose = TRUE,
...
)
\method{FindVariableFeatures}{Assay}(
object,
selection.method = "vst",
loess.span = 0.3,
clip.max = "auto",
mean.function = FastExpMean,
dispersion.function = FastLogVMR,
num.bin = 20,
binning.method = "equal_width",
nfeatures = 2000,
mean.cutoff = c(0.1, 8),
dispersion.cutoff = c(1, Inf),
verbose = TRUE,
...
)
\method{FindVariableFeatures}{Seurat}(
object,
assay = NULL,
selection.method = "vst",
loess.span = 0.3,
clip.max = "auto",
mean.function = FastExpMean,
dispersion.function = FastLogVMR,
num.bin = 20,
binning.method = "equal_width",
nfeatures = 2000,
mean.cutoff = c(0.1, 8),
dispersion.cutoff = c(1, Inf),
verbose = TRUE,
...
)
}
\arguments{
\item{object}{An object}
\item{...}{Arguments passed to other methods}
\item{selection.method}{How to choose top variable features. Choose one of :
\itemize{
\item{vst:}{ First, fits a line to the relationship of log(variance) and
log(mean) using local polynomial regression (loess). Then standardizes the
feature values using the observed mean and expected variance (given by the
fitted line). Feature variance is then calculated on the standardized values
after clipping to a maximum (see clip.max parameter).}
\item{mean.var.plot (mvp):}{ First, uses a function to calculate average
expression (mean.function) and dispersion (dispersion.function) for each
feature. Next, divides features into num.bin (deafult 20) bins based on
their average expression, and calculates z-scores for dispersion within
each bin. The purpose of this is to identify variable features while
controlling for the strong relationship between variability and average
expression.}
\item{dispersion (disp):}{ selects the genes with the highest dispersion values}
}}
\item{loess.span}{(vst method) Loess span parameter used when fitting the
variance-mean relationship}
\item{clip.max}{(vst method) After standardization values larger than
clip.max will be set to clip.max; default is 'auto' which sets this value to
the square root of the number of cells}
\item{mean.function}{Function to compute x-axis value (average expression).
Default is to take the mean of the detected (i.e. non-zero) values}
\item{dispersion.function}{Function to compute y-axis value (dispersion).
Default is to take the standard deviation of all values}
\item{num.bin}{Total number of bins to use in the scaled analysis (default
is 20)}
\item{binning.method}{Specifies how the bins should be computed. Available
methods are:
\itemize{
\item{equal_width:}{ each bin is of equal width along the x-axis [default]}
\item{equal_frequency:}{ each bin contains an equal number of features (can
increase statistical power to detect overdispersed features at high
expression values, at the cost of reduced resolution along the x-axis)}
}}
\item{verbose}{show progress bar for calculations}
\item{nfeatures}{Number of features to select as top variable features;
only used when \code{selection.method} is set to \code{'dispersion'} or
\code{'vst'}}
\item{mean.cutoff}{A two-length numeric vector with low- and high-cutoffs for
feature means}
\item{dispersion.cutoff}{A two-length numeric vector with low- and high-cutoffs for
feature dispersions}
\item{assay}{Assay to use}
}
\description{
Identifies features that are outliers on a 'mean variability plot'.
}
\details{
For the mean.var.plot method:
Exact parameter settings may vary empirically from dataset to dataset, and
based on visual inspection of the plot. Setting the y.cutoff parameter to 2
identifies features that are more than two standard deviations away from the
average dispersion within a bin. The default X-axis function is the mean
expression level, and for Y-axis it is the log(Variance/mean). All mean/variance
calculations are not performed in log-space, but the results are reported in
log-space - see relevant functions for exact details.
}