README

The package abclass provides implementations of multi-category angle-based classifiers (Zhang & Liu, 2014) with large-margin unified machines (Liu et al., 2011) for high-dimensional data.

Installation

## Option 1: install from the configured package repository (CRAN by default)
install.packages("abclass")

## Option 2: install directly from the GitHub repository instead.
## requireNamespace() only checks that {remotes} is available; unlike
## require(), it neither attaches the package nor warns when it is missing.
if (!requireNamespace("remotes", quietly = TRUE)) {
  install.packages("remotes")
}
remotes::install_github("wenjie2wang/abclass", upgrade = "never")

Getting Started

library(abclass)
set.seed(123)

## Toy example for demonstration purposes
## (reference: Example 1 in Zhang and Liu (2014)).
ntrain <- 100 # size of training set
ntest <- 1000 # size of testing set
p0 <- 10      # number of actual predictors
p1 <- 100     # number of random predictors
k <- 5        # number of categories

n <- ntrain + ntest
p <- p0 + p1
train_idx <- seq_len(ntrain)

## NOTE: the order of the random draws below (y, mu, x0, x1) determines the
## simulated data for the given seed, so do not reorder these statements.
y <- sample(k, size = n, replace = TRUE)         # response
mu <- matrix(rnorm(p0 * k), nrow = k, ncol = p0) # one mean vector per row
## normalize each mean vector (row) to unit Euclidean norm so that the
## category centers lie on the unit sphere
mu <- mu / sqrt(rowSums(mu ^ 2))
## draw the p0 actual predictors of each observation around the mean vector
## of its category; vapply() guarantees a length-p0 numeric result per draw
x0 <- t(vapply(
  y,
  function(i) rnorm(p0, mean = mu[i, ], sd = 0.25),
  FUN.VALUE = numeric(p0)
))
## random predictors generated independently of the response
x1 <- matrix(rnorm(p1 * n, sd = 0.3), nrow = n, ncol = p1)
x <- cbind(x0, x1)
## the first ntrain rows form the training set and the rest the testing set;
## drop = FALSE keeps the subsets as matrices
train_x <- x[train_idx, , drop = FALSE]
test_x <- x[-train_idx, , drop = FALSE]
y <- factor(paste0("label_", y))
train_y <- y[train_idx]
test_y <- y[-train_idx]

### regularization through elastic-net penalty
## Each fit below is followed by predictions for the testing set, a
## cross-table of true labels (rows) against predicted labels (columns),
## and the proportion of testing labels that were predicted correctly.

## logistic deviance loss
model1 <- abclass(
  train_x, train_y,
  nlambda = 100, nfolds = 3, loss = "logistic"
)
pred1 <- predict(model1, test_x)
table(test_y, pred1)

mean(test_y == pred1) # accuracy

## exponential loss approximating AdaBoost
model2 <- abclass(
  train_x, train_y,
  nlambda = 100, nfolds = 3, loss = "boost"
)
pred2 <- predict(model2, test_x, s = "cv_1se")
table(test_y, pred2)

mean(test_y == pred2) # accuracy

## hybrid hinge-boost loss
model3 <- abclass(
  train_x, train_y,
  nlambda = 100, nfolds = 3, loss = "hinge-boost"
)
pred3 <- predict(model3, test_x)
table(test_y, pred3)

mean(test_y == pred3) # accuracy

## large-margin unified loss
model4 <- abclass(
  train_x, train_y,
  nlambda = 100, nfolds = 3, loss = "lum"
)
pred4 <- predict(model4, test_x)
table(test_y, pred4)

mean(test_y == pred4) # accuracy

### variable selection via group lasso
## Each fit below is followed by predictions for the testing set, a
## cross-table of true labels (rows) against predicted labels (columns),
## and the proportion of testing labels that were predicted correctly.
## NOTE: model1-model4 and pred1-pred4 are reassigned here.

## logistic deviance loss
model1 <- abclass(
  train_x, train_y,
  nlambda = 100, nfolds = 3, grouped = TRUE, loss = "logistic"
)
pred1 <- predict(model1, test_x, s = "cv_1se")
table(test_y, pred1)

mean(test_y == pred1) # accuracy

## exponential loss approximating AdaBoost
model2 <- abclass(
  train_x, train_y,
  nlambda = 100, nfolds = 3, grouped = TRUE, loss = "boost"
)
pred2 <- predict(model2, test_x, s = "cv_1se")
table(test_y, pred2)

mean(test_y == pred2) # accuracy

## hybrid hinge-boost loss
model3 <- abclass(
  train_x, train_y,
  nlambda = 100, nfolds = 3, grouped = TRUE, loss = "hinge-boost"
)
pred3 <- predict(model3, test_x)
table(test_y, pred3)

mean(test_y == pred3) # accuracy

## large-margin unified loss
model4 <- abclass(
  train_x, train_y,
  nlambda = 100, nfolds = 3, grouped = TRUE, loss = "lum"
)
pred4 <- predict(model4, test_x)
table(test_y, pred4)

mean(test_y == pred4) # accuracy

abclass

Installation

Getting Started

References

License