require 'statsample' samples=150 variables=30 iterations=50 Statsample::Analysis.store(Statsample::Factor::ParallelAnalysis) do Daru.lazy_update = true rng = Distribution::Normal.rng() f1 = rnorm(samples) f2 = rnorm(samples) f3 = rnorm(samples) vectors={} variables.times do |i| vectors["v#{i}".to_sym] = Daru::Vector.new(samples.times.collect {|nv| f1[nv]*i+(f2[nv]*(15-i))+((f3[nv]*(30-i))*1.5)*rng.call}) vectors["v#{i}".to_sym].rename "Vector #{i}" end ds = Daru::DataFrame.new(vectors) pa=Statsample::Factor::ParallelAnalysis.new(ds, :iterations=>iterations, :debug=>true) pca=pca(cor(ds)) echo "There are 3 real factors on data" summary pca echo "Traditional Kaiser criterion (k>1) returns #{pca.m} factors" summary pa echo "Parallel Analysis returns #{pa.number_of_factors} factors to preserve" Daru.lazy_update = false end Statsample::Analysis.run_batch