Load the class labels sent by Forrest.
# Per-synapse class labels; row 18 is dropped (presumably an excluded
# synapse — TODO confirm with the label provider).
cl <- read.csv("cleft_class.csv")[-18,]
# Feature matrix of tight synapse annotations (collman15v2 dataset).
f0 <- read.csv("collman15v2_tightAnnotationsF0.csv")
# Standardize every feature to mean 0 / sd 1 before clustering.
sf0 <- scale(f0, center = TRUE, scale = TRUE)
# Synapse centroid locations (columns x, y, z used in plots below).
loc <- read.csv("locationstest20171211.csv")
# Class balance of the two candidate label columns.
table(cl$gaba)
##
## 0 1
## 214 22
table(cl$postgaba)
##
## 0 1
## 212 24
#ccol <- read.csv("params.csv")[1,-c(1,14)]
# One color per feature column, grouping related channels for plotting.
ccol <- c('blue', 'blue', 'blue', 'red', 'red', 'red', 'black', 'black', 'green', 'green', 'green', 'green')
# Seed before the stochastic clustering pipeline for reproducibility.
set.seed(1030)
# runAll / mlocation are project helpers (not shown in this file);
# L[[1]] is replaced by the location plot on the unscaled features.
L <- runAll(sf0, ccol = ccol)
L[[1]] <- mlocation(f0, ccol = ccol)
## 1 21 22
## 0.7712 0.1314 0.0975
Here we restrict our hierarchical GMM function to one split only and then compare with the true gaba/non-gaba class labels.
# Reproducible fit: hierarchical GMM restricted to a single split
# (maxDepth = 2 gives exactly two leaf clusters).
set.seed(1030)
h2 <- hmc(sf0, maxDepth = 2)
# Recode the leaf labels to 0/1 so they align with the binary gaba coding.
l2 <- h2$dat$labels$col - 1
# Observed agreement between the 2-cluster solution and the gaba truth.
p0 <- mclust::adjustedRandIndex(l2, cl$gaba)
# Permutation null distribution: ARI of randomly shuffled cluster labels,
# 10,000 replicates. NOTE(review): %dopar% requires a registered parallel
# backend (e.g. doParallel) — confirm one is set up earlier in the project.
perms <- foreach(i = 1:1e4, .combine = c) %dopar% {
# Per-iteration seed so each parallel worker permutes reproducibly.
set.seed(i*2)
mclust::adjustedRandIndex(sample(l2), cl$gaba)
}
# Cluster assignments from the depth-2 fit (used as color indices below).
tmp <- h2$dat$labels$col
# Pairs plot of the clustered features, colored by predicted cluster.
pairs(h2$dat$data,
col = viridis(max(tmp))[tmp],
pch = 19, cex = 0.5, main = "colored by prediction")
# Same pairs plot, colored by the true gaba label for visual comparison.
pairs(h2$dat$data,
col = c('darkblue', 'violet')[cl$gaba +1],
pch = 19, cex = 0.5, main = "colored by truth")
# Dendrogram of the hierarchical fit (project helper).
plotDend(h2)
## 1 2
## 0.8093 0.1907
# Stacked cluster-mean display at depth 2 (project helper).
stackM(h2, depth = 2, centered = TRUE, ccol = ccol)
# Permutation null distribution of ARI with the observed value in red;
# xlim is padded 25% past p0 so the observed line stays visible.
hist(perms, xlim = c(min(perms), p0 + 0.25*p0),
main = "permutation test of ARI values")
abline(v = p0, col = 'red')
# Combine synapse centroid locations with the truth labels and the
# hierarchical-GMM predictions, then visualize agreement per z-slice.
df1 <- data.frame(loc)
df1$gaba <- as.factor(cl$gaba)
df1$classification <- as.factor(tmp - 1)
df1$correct_classification <- df1$classification == df1$gaba
# Confusion-matrix indicator columns; gaba == 1 is the positive class.
df1$TN <- df1$classification == 0 & df1$gaba == 0
df1$FN <- df1$classification == 0 & df1$gaba == 1
df1$FP <- df1$classification == 1 & df1$gaba == 0
df1$TP <- df1$classification == 1 & df1$gaba == 1
#df1$text <- links
# Centroid scatter faceted by z-slice; shape marks correct predictions.
p1 <- ggplot(df1,
             aes(x = x, y = y, z = z,
                 col = gaba, shape = correct_classification)) +
  facet_wrap(~ z, ncol = 6) +
  geom_point()
p1
ggplotly(p1)
# Interactive plotly version with per-point hover links (kept for reference).
#p2 <- plot_ly(df1, x = ~x, y = ~y, color = ~gaba,
# hoverinfo = 'text',
# text = ~links)
#p2
#
#htmlwidgets::saveWidget(as_widget(p2), "links.html")
# Confusion table: predicted cluster (rows) vs true gaba label (columns).
# Outer parentheses print the assigned table.
(ta <- table(classification = tmp-1, df1$gaba))
##
## classification 0 1
## 0 189 2
## 1 25 20
The above table shows that out of 22 true gaba synapses 2 were mis-classified as non-gaba synapses.
Note that the centroids are calculated from the annotations, which means that a centroid might not lie in an area with annotated pixels.
FalseNegatives |
---|
3826, 2554, 18 |
4065, 2605, 15 |
# Random-forest classification of gaba from the scaled features.
set.seed(317)
rfdat <- data.table(gaba = as.factor(cl$gaba), sf0)
# Fit on the full data set. NOTE(review): rf1 is never used below —
# confirm whether this full-data fit is still needed or can be removed.
rf1 <- randomForest(gaba ~ ., data = rfdat)
#set.seed(317)
# Fresh seed for the hold-out split: 100 training rows, the rest test.
set.seed(2^13)
train <- sample(nrow(rfdat), 100)
test <- setdiff(1:nrow(rfdat), train)
# Class balance of the held-out test set.
table(rfdat[test,]$gaba)
##
## 0 1
## 123 13
# Refit on the training subset only, keeping variable importances.
rf2 <- randomForest(gaba ~ ., data = rfdat[train,], importance = TRUE)
print(rf2)
##
## Call:
## randomForest(formula = gaba ~ ., data = rfdat[train, ], importance = TRUE)
## Type of random forest: classification
## Number of trees: 500
## No. of variables tried at each split: 3
##
## OOB estimate of error rate: 3%
## Confusion matrix:
## 0 1 class.error
## 0 91 0 0.0000000
## 1 3 6 0.3333333
# Held-out predictions; -c('gaba') drops the response column
# (data.table column-drop syntax).
rf2.pred <- predict(rf2, newdata = rfdat[test,-c('gaba')])
# Test-set confusion matrix: predictions (rows) vs truth (columns).
table(rf2.pred, rfdat[test,]$gaba)
##
## rf2.pred 0 1
## 0 122 2
## 1 1 11
# Variable-importance plot for the trained forest.
varImpPlot(rf2)