abikoushi · December 18, 2025 01:11 · abikoushi · Dec 18, 2025
diff --git a/overparametrize.R b/overparametrize.R
 library(moltenNMF)
 library(Matrix)

 # 2 x 2 factorial design and its encoding by sparse_onehot()
 # (presumably one indicator column per factor level -- confirm in moltenNMF).
 df <- expand.grid(letters[1:2], LETTERS[1:2])
 X <- sparse_onehot(~ ., data = df)

 # 4 x 3 matrix, filled column-wise: column 1 is constant 0.5,
 # column 2 picks row 2 and column 3 picks row 4.
 A <- matrix(
   c(
     0.5, 0.5, 0.5, 0.5,
     0, 1, 0, 0,
     0, 0, 0, 1
   ),
   4, 3
 )

 print(A)

 # Check that X %*% A reproduces the matrix from sparse.model.matrix().
 Xs <- sparse.model.matrix(~ ., data = df)
 print(all(X %*% A == Xs))

 ###

 # Attach "indices", "term.labels" and "value.labels" attributes to a model
 # matrix, derived from its "assign" and "contrasts" attributes.
 #
 # X: an object that may carry "assign" / "contrasts" attributes; when
 #    "contrasts" has names, X must also have a `Dimnames` slot.
 # Returns X with the extra attributes set where the inputs were available.
 set_attr_modelmat <- function(X) {
   assign_vec <- attr(X, "assign")
   if (!is.null(assign_vec)) {
     # Cumulative run lengths of "assign", with a leading 0.
     run_lengths <- rle(assign_vec)$lengths
     attr(X, "indices") <- c(0L, cumsum(run_lengths))
   }

   term_names <- names(attr(X, "contrasts"))
   if (is.null(term_names)) {
     return(X)
   }
   attr(X, "term.labels") <- term_names

   col_names <- X@Dimnames[[2]]
   if (!is.null(col_names)) {
     # The labels are joined into one regular expression (not escaped) and the
     # first match is removed from every column name.
     pattern <- paste(term_names, collapse = "|")
     attr(X, "value.labels") <- sub(pattern, "", col_names)
   }
   X
 }

 # Titanic counts as a data frame, modelled with main effects only.
 df <- as.data.frame(Titanic)
 f <- Freq ~ Class + Sex + Age + Survived

 # Redundant design matrix.
 X_s <- sparse_onehot(f, data = df)

 # Fit on the redundant design and report the elapsed time.
 L <- 2
 system.time({
   out_s <- mNMF_vb.default(df$Freq, X = X_s, L = L, iter = 1000)
 })

 # Full-rank design matrix, with the attributes set_attr_modelmat() adds.
 X <- set_attr_modelmat(sparse.model.matrix(f, data = df))

 # Fit on the full-rank design and report the elapsed time.
 system.time({
   out <- mNMF_vb.default(df$Freq, X = X, L = L, iter = 1000)
 })

 # ELBO traces without their first element:
 # dashed = redundant design, solid = full-rank design.
 plot(out_s$ELBO[-1], type = "l", lty = 2)
 lines(out$ELBO[-1], type = "l")

 # shape / rate of each fit (presumably the posterior mean -- confirm).
 V <- out$shape / out$rate
 V_s <- out_s$shape / out_s$rate

 fit <- product_m.default(X, V)
 fit_s <- product_m.default(X_s, V_s)

 # Observed counts against both sets of fitted values, with the y = x line.
 plot(df$Freq, fit)
 points(df$Freq, fit_s, col = "royalblue", pch = 2)
 abline(0, 1, lty = 2)

 # Build the matrix A that maps the columns of a redundant design matrix onto
 # a reduced set of columns.
 #
 # X: an object whose "indices" attribute holds cumulative column counts per
 #    term, starting with 0 (term k covers columns ind[k] + 1 .. ind[k + 1]).
 # Returns a numeric matrix with ind[last] rows and
 # ind[last] - (number of terms) + 1 columns: column 1 is constant
 # 1 / (number of terms); for every term, each column except its first gets a
 # single 1 in a dedicated column of A.
 # Stops with an error when X has no usable "indices" attribute.
 fullranktrans <- function(X) {
   ind <- attr(X, "indices")
   if (length(ind) == 0L) {
     stop("`X` must carry a non-empty \"indices\" attribute", call. = FALSE)
   }

   n_terms <- length(ind[-1])
   n_rows <- ind[length(ind)]
   A <- matrix(0, n_rows, n_rows - n_terms + 1)

   for (k in seq_len(n_terms)) {
     first <- ind[k] + 2
     last <- ind[k + 1L]
     # A one-column term has first > last; `first:last` would then count
     # downwards and mark the wrong rows, so such terms are skipped.
     if (first <= last) {
       rows <- first:last
       A[cbind(rows, rows - k + 1)] <- 1
     }
   }

   A[, 1] <- 1 / n_terms
   A
 }

 # Matrix taking the redundant design to the full-rank one; verify it.
 A <- fullranktrans(X_s)
 print(all(X == X_s %*% A))
 # Recorded output: [1] TRUE

 # Carry the full-rank estimates through A on the log scale, then compare
 # them with the estimates from the redundant fit.
 V2 <- exp(A %*% log(V))
 image(V_s)
 image(V2)
 cor(V_s, V2)

 # Observed counts against fitted values from V2 and from the redundant fit.
 fit2 <- product_m.default(X_s, V2)
 plot(df$Freq, fit2)
 points(df$Freq, fit_s, col = "royalblue", pch = 2)
 abline(0, 1, lty = 2)
	library(moltenNMF)
	library(Matrix)

	# 2 x 2 factorial design and its encoding by sparse_onehot()
	# (presumably one indicator column per factor level -- confirm in moltenNMF).
	df <- expand.grid(letters[1:2], LETTERS[1:2])
	X <- sparse_onehot(~ ., data = df)

	# 4 x 3 matrix, filled column-wise: column 1 is constant 0.5,
	# column 2 picks row 2 and column 3 picks row 4.
	A <- matrix(
	  c(
	    0.5, 0.5, 0.5, 0.5,
	    0, 1, 0, 0,
	    0, 0, 0, 1
	  ),
	  4, 3
	)

	print(A)

	# Check that X %*% A reproduces the matrix from sparse.model.matrix().
	Xs <- sparse.model.matrix(~ ., data = df)
	print(all(X %*% A == Xs))

	###

	# Attach "indices", "term.labels" and "value.labels" attributes to a model
	# matrix, derived from its "assign" and "contrasts" attributes.
	#
	# X: an object that may carry "assign" / "contrasts" attributes; when
	#    "contrasts" has names, X must also have a `Dimnames` slot.
	# Returns X with the extra attributes set where the inputs were available.
	set_attr_modelmat <- function(X) {
	  assign_vec <- attr(X, "assign")
	  if (!is.null(assign_vec)) {
	    # Cumulative run lengths of "assign", with a leading 0.
	    attr(X, "indices") <- c(0L, cumsum(rle(assign_vec)$lengths))
	  }

	  labs <- names(attr(X, "contrasts"))
	  if (!is.null(labs)) {
	    attr(X, "term.labels") <- labs
	    col_names <- X@Dimnames[[2]]
	    if (!is.null(col_names)) {
	      # Join the labels with a plain "|" (regex alternation). "\|" is not a
	      # valid R string escape and stops the file from parsing.
	      # The labels are used as a regular expression without escaping.
	      pattern <- paste(labs, collapse = "|")
	      attr(X, "value.labels") <- sub(pattern, "", col_names)
	    }
	  }
	  X
	}

	# Titanic counts as a data frame, modelled with main effects only.
	df <- as.data.frame(Titanic)
	f <- Freq ~ Class + Sex + Age + Survived

	# Redundant design matrix.
	X_s <- sparse_onehot(f, data = df)

	# Fit on the redundant design and report the elapsed time.
	L <- 2
	system.time({
	  out_s <- mNMF_vb.default(df$Freq, X = X_s, L = L, iter = 1000)
	})

	# Full-rank design matrix, with the attributes set_attr_modelmat() adds.
	X <- set_attr_modelmat(sparse.model.matrix(f, data = df))

	# Fit on the full-rank design and report the elapsed time.
	system.time({
	  out <- mNMF_vb.default(df$Freq, X = X, L = L, iter = 1000)
	})

	# ELBO traces without their first element:
	# dashed = redundant design, solid = full-rank design.
	plot(out_s$ELBO[-1], type = "l", lty = 2)
	lines(out$ELBO[-1], type = "l")

	# shape / rate of each fit (presumably the posterior mean -- confirm).
	V <- out$shape / out$rate
	V_s <- out_s$shape / out_s$rate

	fit <- product_m.default(X, V)
	fit_s <- product_m.default(X_s, V_s)

	# Observed counts against both sets of fitted values, with the y = x line.
	plot(df$Freq, fit)
	points(df$Freq, fit_s, col = "royalblue", pch = 2)
	abline(0, 1, lty = 2)

	# Build the matrix A that maps the columns of a redundant design matrix onto
	# a reduced set of columns.
	#
	# X: an object whose "indices" attribute holds cumulative column counts per
	#    term, starting with 0 (term k covers columns ind[k] + 1 .. ind[k + 1]).
	# Returns a numeric matrix with ind[last] rows and
	# ind[last] - (number of terms) + 1 columns: column 1 is constant
	# 1 / (number of terms); for every term, each column except its first gets a
	# single 1 in a dedicated column of A.
	# Stops with an error when X has no usable "indices" attribute.
	fullranktrans <- function(X) {
	  ind <- attr(X, "indices")
	  if (length(ind) == 0L) {
	    stop("`X` must carry a non-empty \"indices\" attribute", call. = FALSE)
	  }

	  n_terms <- length(ind[-1])
	  n_rows <- ind[length(ind)]
	  A <- matrix(0, n_rows, n_rows - n_terms + 1)

	  for (k in seq_len(n_terms)) {
	    first <- ind[k] + 2
	    last <- ind[k + 1L]
	    # A one-column term has first > last; `first:last` would then count
	    # downwards and mark the wrong rows, so such terms are skipped.
	    if (first <= last) {
	      rows <- first:last
	      A[cbind(rows, rows - k + 1)] <- 1
	    }
	  }

	  A[, 1] <- 1 / n_terms
	  A
	}

	# Matrix taking the redundant design to the full-rank one; verify it.
	A <- fullranktrans(X_s)
	print(all(X == X_s %*% A))
	# Recorded output: [1] TRUE

	# Carry the full-rank estimates through A on the log scale, then compare
	# them with the estimates from the redundant fit.
	V2 <- exp(A %*% log(V))
	image(V_s)
	image(V2)
	cor(V_s, V2)

	# Observed counts against fitted values from V2 and from the redundant fit.
	fit2 <- product_m.default(X_s, V2)
	plot(df$Freq, fit2)
	points(df$Freq, fit_s, col = "royalblue", pch = 2)
	abline(0, 1, lty = 2)
No results found