jennyfarmer
diff --git a/‎ChebyShev.cpp‎
Lines changed: 78 additions & 0 deletions b/‎ChebyShev.cpp‎
Lines changed: 78 additions & 0 deletions
diff --git a/‎ChebyShev.h‎
Lines changed: 40 additions & 0 deletions b/‎ChebyShev.h‎
Lines changed: 40 additions & 0 deletions
diff --git a/‎CompilePDF.m‎
Lines changed: 1 addition & 0 deletions b/‎CompilePDF.m‎
Lines changed: 1 addition & 0 deletions
diff --git a/‎EstimatePDF.cpp‎
Lines changed: 141 additions & 0 deletions b/‎EstimatePDF.cpp‎
Lines changed: 141 additions & 0 deletions
diff --git a/‎EstimatePDF.h‎
Lines changed: 26 additions & 0 deletions b/‎EstimatePDF.h‎
Lines changed: 26 additions & 0 deletions
diff --git a/‎EstimatePDF.m‎
Lines changed: 73 additions & 0 deletions b/‎EstimatePDF.m‎
Lines changed: 73 additions & 0 deletions
diff --git a/‎FigureSettings.m‎
Lines changed: 19 additions & 0 deletions b/‎FigureSettings.m‎
Lines changed: 19 additions & 0 deletions
@@ -0,0 +1,78 @@
+/* 
+ * PDF Estimator:  A non-parametric probability density estimation tool based on maximum entropy
+ * File:   ChebyShev.cpp
+ * Copyright (C) 2018
+ * Jenny Farmer [email protected]
+ * Donald Jacobs [email protected]
+ * 
+ * This program is free software: you can redistribute it and/or modify it under the terms of the GNU General Public License as published 
+ * by the Free Software Foundation, either version 3 of the License, or (at your option) any later version. This program is distributed in 
+ * the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR 
+ * PURPOSE.  See the GNU General Public License for more details. You should have received a copy of the GNU General Public License along with 
+ * this program.  If not, see <http://www.gnu.org/licenses/>.
+ */
+
+#include "ChebyShev.h"
+
+/*
+ * Default constructor.
+ *
+ * Starts with no grid attached (size 0, null dz pointer, empty term cache)
+ * so that every member holds a defined value before initialize() is called.
+ */
+ChebyShev::ChebyShev() : size(0), dz(nullptr) {
+}
+
+/*
+ * Copy constructor.
+ *
+ * Copies the grid size, the grid pointer and the cached terms from orig.
+ * The dz pointer is copied as-is (the class never allocates or frees it),
+ * so the copy refers to the same caller-provided array as orig.
+ */
+ChebyShev::ChebyShev(const ChebyShev& orig)
+    : size(orig.size), dz(orig.dz), termsT(orig.termsT) {
+}
+
+/* Destructor: nothing to release explicitly; members clean up after themselves. */
+ChebyShev::~ChebyShev() = default;
+
+/*
+ * Attaches a grid and computes the first three terms for every grid point.
+ *
+ * Each grid value dz[z] is mapped to x = -1 + 2*dz[z] and the terms
+ *     T0 = 1,  T1 = x,  T2 = 2*x*x - 1
+ * are stored at indices 0, 1 and 2 of the term cache.
+ *
+ * dzLocal   : grid values; only the pointer is stored, so the array must stay
+ *             alive while this object is used (addMode() reads it again).
+ *             NOTE(review): presumably values lie in [0, 1] so that x spans
+ *             [-1, 1] -- confirm against the caller.
+ * sizeLocal : number of entries in dzLocal.
+ */
+void ChebyShev::initialize(double dzLocal[], int sizeLocal) {
+    this->size = sizeLocal;
+    this->dz = dzLocal;
+
+    // Discard terms cached for a previous grid; otherwise a second call would
+    // append behind the stale entries and indices 0..2 would keep returning them.
+    termsT.clear();
+
+    std::vector<double> zeroT;
+    std::vector<double> oneT;
+    std::vector<double> twoT;
+    if (size > 0) {
+        zeroT.reserve(size);
+        oneT.reserve(size);
+        twoT.reserve(size);
+    }
+
+    for (int z = 0; z < size; z++) {
+        const double x = -1 + dz[z]*2;
+        zeroT.push_back(1);
+        oneT.push_back(x);
+        twoT.push_back(2*x*x - 1);
+    }
+    termsT.push_back(zeroT);
+    termsT.push_back(oneT);
+    termsT.push_back(twoT);
+}
+
+/*
+ * Returns the cached values of the term of order `mode`, one per grid point.
+ *
+ * Missing orders are generated one at a time, from the current end of the
+ * cache up to and including `mode`, so any order may be requested directly.
+ * The returned pointer refers to storage held inside this object's term
+ * cache (never to a temporary); the caller must not free it.
+ *
+ * Throws std::out_of_range (from addMode) if fewer than two terms are cached,
+ * i.e. if initialize() has not been called.
+ */
+double* ChebyShev::getTerms(unsigned mode) {
+    // addMode() always appends at the end of the cache, so request exactly the
+    // next missing order until `mode` itself is present.
+    while (termsT.size() <= mode) {
+        addMode(static_cast<int>(termsT.size()));
+    }
+    // data() is well defined even when the grid is empty, unlike &v[0].
+    return termsT[mode].data();
+}
+
+/*
+ * Makes sure at least `mode` terms (orders 0 .. mode-1) are cached, then
+ * returns a copy of the whole term cache. The copy may hold more than `mode`
+ * entries if higher orders were generated earlier.
+ */
+vector < vector < double > > ChebyShev::getAllTerms(unsigned mode) {
+    // Grow the cache one order at a time until it holds `mode` entries.
+    while (termsT.size() < mode) {
+        addMode(static_cast<int>(termsT.size()));
+    }
+    return termsT;
+}
+
+
+/*
+ * Computes the term of order `mode` from the two preceding cached terms using
+ *     T[mode] = 2*x*T[mode-1] - T[mode-2],   x = -1 + 2*dz[z]
+ * for every grid point z, appends it to the end of the cache and returns it.
+ *
+ * The result is always appended, so it ends up at index `mode` only when
+ * `mode` equals the current number of cached terms.
+ *
+ * Throws std::out_of_range if term mode-1 or mode-2 is not cached.
+ */
+vector <double> ChebyShev::addMode(int mode) {
+    // Read the predecessors in place instead of copying both vectors.
+    const vector <double>& T = termsT.at(mode-1);
+    const vector <double>& Tprev = termsT.at(mode-2);
+
+    vector <double> Tnext;
+    if (size > 0) {
+        Tnext.reserve(size);
+    }
+
+    for (int z = 0; z < size; z++) {
+        const double x = -1 + 2*dz[z];
+        Tnext.push_back(2*x*T[z] - Tprev[z]);
+    }
+    // push_back may reallocate termsT; T and Tprev are not used past this point.
+    termsT.push_back(Tnext);
+    return Tnext;
+}
+    
@@ -0,0 +1,40 @@
+/*  
+ * PDF Estimator:  A non-parametric probability density estimation tool based on maximum entropy
+ * File:   ChebyShev.h
+ * Copyright (C) 2018
+ * Jenny Farmer [email protected]
+ * Donald Jacobs [email protected]
+ * 
+ * This program is free software: you can redistribute it and/or modify it under the terms of the GNU General Public License as published 
+ * by the Free Software Foundation, either version 3 of the License, or (at your option) any later version. This program is distributed in 
+ * the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR 
+ * PURPOSE.  See the GNU General Public License for more details. You should have received a copy of the GNU General Public License along with 
+ * this program.  If not, see <http://www.gnu.org/licenses/>.
+ */
+
+#ifndef CHEBYSHEV_HPP
+#define	CHEBYSHEV_HPP
+
+#include <vector>
+
+using namespace std;
+/*
+ * Caches polynomial terms evaluated on a caller-supplied grid.
+ *
+ * initialize() stores the grid and the first three terms (1, x, 2*x*x - 1 with
+ * x = -1 + 2*dz[z]); higher orders are produced on demand by addMode() using
+ * the recurrence T[n] = 2*x*T[n-1] - T[n-2].
+ */
+class ChebyShev {
+public:
+    ChebyShev();
+    ChebyShev(const ChebyShev& orig);
+    virtual ~ChebyShev();
+
+    // Stores the grid pointer/size and computes terms of order 0, 1 and 2.
+    void initialize(double dzLocal[], int sizeLocal);
+
+    // Returns the values of the term of order `mode`, generating it if it is
+    // not cached yet.
+    double * getTerms(unsigned mode);
+
+    // Ensures orders 0 .. mode-1 are cached and returns a copy of the cache.
+    vector < vector < double > >  getAllTerms(unsigned mode);
+
+private:
+    int size = 0;                       // number of grid points in dz
+    double * dz = nullptr;              // caller-provided grid; never allocated or freed here
+    vector < vector<double> > termsT;   // termsT[order][gridIndex]
+
+    // Appends the term of order `mode`, computed from orders mode-1 and mode-2.
+    vector <double> addMode(int mode);
+
+};
+
+#endif	/* CHEBYSHEV_HPP */
+
@@ -0,0 +1 @@
+% Build script: invokes MATLAB's mex command with the -O option on the C++
+% source files listed below (EstimatePDF.cpp is listed first).
+mex -O  'EstimatePDF.cpp' 'OutputControl.cpp' 'callPDF.cpp' 'WriteResults.cpp' 'Score.cpp' 'ScoreLL.cpp' 'ScoreQZ.cpp' 'MinimizeScore.cpp' 'InputParameters.cpp' 'InputData.cpp' 'ChebyShev.cpp'
@@ -0,0 +1,141 @@
+/* 
+
+ * File:   EstimatePDF.cpp
+ * Author: jenny
+ * 
+ * Created on December 3, 2018, 8:32 AM
+ */
+
+
+#include "EstimatePDF.h"
+#include "callPDF.h" 
+
+#include <memory>
+#include <string>
+#include <vector>
+
+    
+
+/*
+ * MEX entry point.
+ *
+ * inputs[0]  : data sample (double array, at least three elements).
+ * inputs[1]  : optional struct whose fields override estimator parameters;
+ *              each recognised field name is forwarded to the matching
+ *              callPDF setter, any other name is reported via displayError.
+ *
+ * outputs[0] : solutionFailed flag.
+ * outputs[1..8] (only written when the solution did not fail):
+ *              Vx, Vpdf, Vcdf, Vsqr, Vlagrange, thresholdScore,
+ *              confidenceScore, Vr -- each as an N x 1 x 1 array.
+ *
+ * NOTE(review): the argument checks rely on OutputControl::displayError
+ * aborting the call; its behaviour is not visible here -- confirm.
+ */
+void MexFunction::operator()(matlab::mex::ArgumentList outputs, matlab::mex::ArgumentList inputs) {   
+
+    int nParameters = inputs.size();    
+    matlabPtr = getEngine();
+    out.debug = true;    
+
+    matlab::data::ArrayFactory factory;
+    if (nParameters < 1) {        
+        out.displayError(matlabPtr, "Data sample required");
+    }
+    if (nParameters > 2) {        
+        out.displayError(matlabPtr, "Only two input arguements allowed:  data sample and parameter structure");
+    }            
+
+    TypedArray<double> doubleArray = std::move(inputs[0]);
+    int sampleSize = doubleArray.getNumberOfElements();
+    if (sampleSize < 3) {
+        out.displayError(matlabPtr, "Must have at least three data points in sample");
+    }
+
+    // Heap-backed copy of the sample: a variable-length stack array is not
+    // standard C++ and can overflow the stack for large samples.
+    std::vector<double> sampleData;
+    sampleData.reserve(doubleArray.getNumberOfElements());
+    for (auto& elem : doubleArray) {
+        sampleData.push_back(elem);
+    }           
+
+    // Owned by a smart pointer so the estimator is released on every exit
+    // path, including exceptions thrown while parsing parameters or solving.
+    std::unique_ptr<callPDF> pd(new callPDF(matlabPtr));   
+
+    if (nParameters > 1) {
+        StructArray const matlabStructArray = inputs[1];
+        auto fields = matlabStructArray.getFieldNames();
+        std::vector<std::string> fieldNames(fields.begin(), fields.end());
+        Array structField;
+        for (const std::string& field : fieldNames) {
+            // Look each value up by the field name being examined rather than
+            // through a separate counter that could drift out of step.
+            if (field == "SURDtarget") {                
+                structField = matlabStructArray[0][field];
+                pd->setSURDtarget(structField[0]);
+            } else if (field == "SURDmin") {
+                structField = matlabStructArray[0][field];
+                pd->setSURDmin(structField[0]);
+            } else if (field == "SURDmax") {                
+                structField = matlabStructArray[0][field];
+                pd->setSURDmax(structField[0]);        
+            } else if (field == "scoreType") {                
+                structField = matlabStructArray[0][field];
+                pd->setScoreType((CharArray(structField)).toAscii());
+            } else if (field == "LagrangeMin") {
+                structField = matlabStructArray[0][field];                
+                pd->setLagrangeMin(structField[0]);
+            } else if (field == "LagrangeMax") {                
+                structField = matlabStructArray[0][field];
+                pd->setLagrangeMax(structField[0]);
+            } else if (field == "integrationPoints") {                
+                structField = matlabStructArray[0][field];                
+                pd->setPoints(structField[0]);
+            } else if (field == "lowBound") {                
+                structField = matlabStructArray[0][field];
+                pd->setLow(structField[0]);
+            } else if (field == "highBound") {                
+                structField = matlabStructArray[0][field];
+                pd->setHigh(structField[0]);
+            } else if (field == "outlierCutoff") {
+                structField = matlabStructArray[0][field];
+                pd->setOutlierCutoff(structField[0]);            
+            } else if (field == "partition") {                
+                structField = matlabStructArray[0][field];
+                pd->setPartitionSize(structField[0]);
+            } else if (field == "debug") {                
+                structField = matlabStructArray[0][field];
+                pd->setDebug(structField[0]);  
+            } else if (field == "minVariance") {                
+                structField = matlabStructArray[0][field];
+                pd->setVariance(structField[0]);
+            } else if (field == "adaptiveDx") {
+                structField = matlabStructArray[0][field];
+                pd->setAdaptiveDx(structField[0]);
+            } else {
+                std::string unknown = "Unknown parameter: " + field;
+                out.displayError(matlabPtr, unknown);
+            }                
+        }  
+    }                     
+    pd->makeCall(sampleSize, sampleData.data());               
+
+    // First output: failure flag, always returned.
+    std::vector<int> failed;
+    failed.push_back(pd->solutionFailed);
+    ArrayDimensions sz = {failed.size(), 1, 1};
+    TypedArray<int> MsolutionFailed = factory.createArray(sz, failed.begin(), failed.end());
+    outputs[0] = MsolutionFailed;             
+
+    // Remaining outputs are only populated for a successful solution.
+    if (!pd->solutionFailed) {
+        sz = {pd->Vx.size(), 1, 1};        
+        TypedArray<double> Mx = factory.createArray(sz, pd->Vx.begin(), pd->Vx.end());
+        outputs[1] = Mx;
+        sz = {pd->Vpdf.size(), 1, 1};
+        TypedArray<double> Mpdf = factory.createArray(sz, pd->Vpdf.begin(), pd->Vpdf.end());
+        outputs[2] = Mpdf;
+        sz = {pd->Vcdf.size(), 1, 1};
+        TypedArray<double> Mcdf = factory.createArray(sz, pd->Vcdf.begin(), pd->Vcdf.end());
+        outputs[3] = Mcdf;
+        sz = {pd->Vsqr.size(), 1, 1};
+        TypedArray<double> Msqr = factory.createArray(sz, pd->Vsqr.begin(), pd->Vsqr.end());
+        outputs[4] = Msqr;
+        sz = {pd->Vlagrange.size(), 1, 1};
+        TypedArray<double> Mlagrange = factory.createArray(sz, pd->Vlagrange.begin(), pd->Vlagrange.end());
+        outputs[5] = Mlagrange;                            
+
+        // Scalars are wrapped in one-element vectors to reuse createArray.
+        std::vector<double> threshold;
+        threshold.push_back(pd->thresholdScore);
+        sz = {threshold.size(), 1, 1};
+        TypedArray<double> Mthreshold = factory.createArray(sz, threshold.begin(), threshold.end());
+        outputs[6] = Mthreshold;      
+
+        std::vector<double> confidence;
+        confidence.push_back(pd->confidenceScore);
+        sz = {confidence.size(), 1, 1};
+        TypedArray<double> Mconfidence = factory.createArray(sz, confidence.begin(), confidence.end());
+        outputs[7] = Mconfidence;         
+
+        sz = {pd->Vr.size(), 1, 1};
+        TypedArray<double> Mr = factory.createArray(sz, pd->Vr.begin(), pd->Vr.end());
+        outputs[8] = Mr;
+    } 
+    // pd is released automatically when it goes out of scope.
+
+}
@@ -0,0 +1,26 @@
+/* 
+ * File:   EstimatePDF.h
+ * Author: jenny
+ *
+ * Created on February 2, 2019, 2:00 PM
+ */
+
+#ifndef ESTIMATEPDF_H
+#define	ESTIMATEPDF_H
+
+#include "mexAdapter.hpp"
+#include "OutputControl.h"
+
+using namespace matlab::data;
+
+/*
+ * MEX function object for EstimatePDF. The call operator is defined in
+ * EstimatePDF.cpp.
+ */
+class MexFunction : public matlab::mex::Function {
+
+public:
+    // Invoked with the MATLAB call's output and input argument lists.
+    void operator()(matlab::mex::ArgumentList outputs, matlab::mex::ArgumentList inputs);
+
+private:
+    // Handle to the MATLAB engine; passed to OutputControl when reporting errors.
+    std::shared_ptr<matlab::engine::MATLABEngine> matlabPtr;
+    // Helper used for console/error output.
+    OutputControl out;
+};
+
+#endif
@@ -0,0 +1,73 @@
+% EstimatePDF computes a probability density estimate for a one-dimensional
+% data sample based on a nonparametric maximum entropy method.  For additional 
+% usage information see readme.txt file with this installation.
+% For conceptual details of the method and algorithm, see:
+%
+% Farmer, Jenny and Donald Jacobs (2018). 
+% "High throughput nonparametric probability density estimation." PLoS One 13(5): e0196937.
+%
+%
+% [FAILED, XI, F, CDF, SQR, LAGRANGE, SCORE, CONFIDENCE, SURD] = EstimatePDF(X) 
+% Computes the density estimate of data in sample X with default settings.
+% Outputs returned are as follows:
+%
+%   FAILED              non-zero if solution not found
+%   XI                  relative spacing along x-axis for density estimate
+%   F                   probability density function for estimate (PDF)
+%   CDF                 cumulative density function for estimate
+%   SQR                 scaled quantile residual for sample data
+%   LAGRANGE            Lagrange multipliers estimated to construct PDF
+%   SCORE               Value of final score for estimate
+%   CONFIDENCE          Confidence threshold for estimate
+%   SURD                sampled uniform random data
+%
+% [...] = EstimatePDF(X, PARM) Computes the density estimate of data in 
+% sample X with parameters in a structure defined in PARM.  Parameter options 
+% are listed below.  
+% 
+% Parameter name        Default value               Description
+%
+% lowBound              calculated                  set fixed lower bound
+% highBound             calculated                  set fixed upper bound
+% integrationPoints 	max(1500, 200/n + 200)      data resolution; n=sample size
+% LagrangeMin           1                           minimum number of weighted expansions  
+% LagrangeMax           200                         maximum number of weighted expansions 		
+% SURDtarget            40                          target confidence threshold 
+% SURDmin               5                           minimum confidence threshold accepted
+% SURDmax               100                         maximum confidence threshold accepted
+% scoreType             'QZ'                        Change to 'LL' for log likelihood scoring
+% debug                 false                       detailed output to console
+% partition             1025                        Initial data partition for scoring, set to zero for no partitioning
+% outlierCutoff         7                           Set to zero to disable outlier detection
+% adaptiveDx            true                        Set to false for uniformly spaced numerical solution
+% 		
+%
+% Example:  Plot estimated density for a Normal distribution using default
+% settings:
+%   [failed, y, pdf] = EstimatePDF(randn(1000, 1));
+%   if ~failed
+%       plot(y, pdf);
+%   end
+%
+% Example:  Plot estimated cumulative density for a uniform distribution defined on
+% the interval (0 1):
+%   parms.lowBound = 0;
+%   parms.highBound = 1;
+%   [failed, y, pdf, cdf] = EstimatePDF(rand(1000, 1), parms);
+%   if ~failed
+%       plot(y, cdf);
+%   end
+%
+% Example:  Plot estimated  density for an exponential distribution defined on
+% the interval (0 inf), requiring at least 2 Lagrange multipliers:
+%   parms.lowBound = 0;
+%   parms.LagrangeMin = 2;
+%   [failed, y, pdf] = EstimatePDF(exprnd(1, 1000, 1), parms);
+%   if ~failed
+%       plot(y, pdf);
+%   end
+
+
+
+
+
@@ -0,0 +1,19 @@
+function FigureSettings()
+%FigureSettings creates publication-quality default settings for all
+%subsequent plots in current MATLAB session.
+%
+%   Takes no inputs and returns nothing; it only sets default properties on
+%   the graphics root object (handle 0).
+    width = 6;                                                                 % Width in inches
+    height = 4;                                                                % Height in inches
+    alw = 1.5;                                                                 % AxesLineWidth 
+    fsz = 14;                                                                  % Fontsize 
+    lw = 1.5;                                                                  % LineWidth 
+    msz = 8;                                                                   % MarkerSize 
+
+    set(0,'DefaultFigureColor','white')
+    % Set InvertHardcopy as a root-level figure default. Assigning to a local
+    % variable named fig only creates a struct and changes no figure.
+    set(0,'DefaultFigureInvertHardcopy','off');
+    set(0,'defaultAxesFontSize',fsz); 
+    set(0,'defaultLineLineWidth',lw);   
+    set(0,'defaultLineMarkerSize',msz); 
+    set(0,'defaultAxesLineWidth',alw);
+    % Single position assignment. An earlier one based on the current default
+    % position was immediately overwritten by this one and has been removed.
+    % NOTE(review): width/height are scaled by 100 and 110 here -- presumably a
+    % pixels-per-inch approximation; confirm the intended figure units.
+    set(0,'defaultFigurePosition', [400, 50, width*100, height*110]); 
+end
Original file line number	Diff line number	Diff line change
`@@ -0,0 +1 @@`
	`1`	`+mex -O 'EstimatePDF.cpp' 'OutputControl.cpp' 'callPDF.cpp' 'WriteResults.cpp' 'Score.cpp' 'ScoreLL.cpp' 'ScoreQZ.cpp' 'MinimizeScore.cpp' 'InputParameters.cpp' 'InputData.cpp' 'ChebyShev.cpp'`