mvpa.measures.anova

"""`FeaturewiseDatasetMeasure` that performs a univariate ANOVA.

F-scores are computed for each feature as the standard ratio of between-group
to within-group variance. Groups are defined by samples with unique
labels.

No statistical testing is performed; the raw F-scores are returned as a
sensitivity map. As usual, F-scores range over [0, inf], with greater
values indicating higher sensitivity.
"""

def _call(self, dataset, labels=None):
    """Compute a one-way ANOVA F-score for every feature.

    :Parameters:
      dataset
        Object providing `samples` (one row per sample), `nsamples` and,
        unless `labels` is given, `labels`.
      labels
        Optional per-sample labels defining the groups. If None,
        `dataset.labels` is used. Any sequence is accepted.

    :Returns:
      Array with one F-score per feature. NaN scores (e.g. 0/0 for a
      feature with no variance at all) are replaced by 0.
    """
    # This code is based on SciPy's stats.f_oneway()
    # Copyright (c) Gary Strangman. All rights reserved
    # License: BSD
    #
    # However, it got tweaked and optimized to better fit into PyMVPA.

    if labels is None:
        labels = dataset.labels
    # a plain list would turn `labels == l` below into a scalar comparison
    labels = N.asanyarray(labels)

    # number of groups
    ul = N.unique(labels)
    na = len(ul)
    bign = float(dataset.nsamples)

    alldata = N.asanyarray(dataset.samples)
    # The sums below are modified in place and inherit the samples' dtype.
    # With integer (or boolean) samples the in-place division cannot store
    # its float result and the squares may overflow, so promote such data
    # to float once. Floating point input is used as is.
    if not N.issubdtype(alldata.dtype, N.inexact):
        alldata = alldata.astype(float)

    # total squares of sums
    sostot = N.sum(alldata, axis=0)
    sostot *= sostot
    sostot /= bign

    # total sum of squares
    sstot = N.sum(alldata * alldata, axis=0) - sostot

    # between group sum of squares
    ssbn = 0
    for l in ul:
        # all samples for the respective label
        d = alldata[labels == l]
        sos = N.sum(d, axis=0)
        sos *= sos
        ssbn += sos / float(len(d))

    ssbn -= sostot
    # within
    sswn = sstot - ssbn

    # degrees of freedom
    dfbn = na - 1
    dfwn = bign - na

    # mean sums of squares
    msb = ssbn / float(dfbn)
    msw = sswn / float(dfwn)
    f = msb / msw
    # assure no NaNs -- otherwise it leads instead of
    # sane unittest failure (check of NaNs) to crazy
    #   File "mtrand.pyx", line 1661, in mtrand.shuffle
    #   TypeError: object of type 'numpy.int64' has no len()
    # without any sane backtrace
    f[N.isnan(f)] = 0

    return f

"""Compound comparisons via univariate ANOVA.

Provides F-scores for each label when compared against all other labels.
"""

def _call(self, dataset):
    """Compute featurewise F-scores, one contrast per unique label.

    For every entry of `dataset.uniquelabels` the samples are split into
    two groups (that label vs. everything else) and handed to
    `OneWayAnova._call`. The per-label score vectors are stacked and
    transposed before being returned.
    """
    source_labels = dataset.labels
    # scratch copy, overwritten for each contrast; the dataset's own
    # labels are never modified
    binary_labels = source_labels.copy()

    per_label_scores = []
    for target in dataset.uniquelabels:
        # both masks come from the untouched original labels
        is_target = source_labels == target
        is_other = source_labels != target
        binary_labels[is_target] = 1
        binary_labels[is_other] = 2
        scores = OneWayAnova._call(self, dataset, binary_labels)
        per_label_scores.append(scores)

    # features x labels
    return N.array(per_label_scores).T

Source Code for Module mvpa.measures.anova