void calculateProbabilities ( const std vector train, double probabilities MAX CLASS MAX COLS 1 3 , double classPriors MAX CLASS , double lambda ) int classCounts MAX CLASS 0 for ( int c 0 c MAX CLASS c ) for ( int i 0 i MAX COLS 1 i ) for ( int v 0 v 3 v ) probabilities c i v lambda for ( const auto record train ) classCounts record classLabel for ( size t i 0 i record attributes size ( ) i ) if ( record attributes i MISSING ) probabilities record classLabel i record attributes i for ( int c 0 c MAX CLASS c ) classPriors c static cast ( classCounts c ) train size ( ) for ( int i 0 i MAX COLS 1 i ) double total classCounts c 3 lambda for ( int v 0 v 3 v ) probabilities c i v total ClassLabel naiveBayesPredict ( const Record record, const double probabilities MAX CLASS MAX COLS 1 3 , const double classPriors MAX CLASS ) double logProbs MAX CLASS std log ( classPriors DEMOCRAT ) , std log ( classPriors REPUBLICAN ) for ( int c 0 c MAX CLASS c ) for ( size t i 0 i record attributes size ( ) i ) if ( record attributes i MISSING ) logProbs c std log ( probabilities c i record attributes i ) if ( logProbs DEMOCRAT logProbs REPUBLICAN ) return DEMOCRAT else return REPUBLICAN void evaluateModel ( const std vector data, const double probabilities MAX CLASS MAX COLS 1 3 , const double classPriors MAX CLASS , double accuracy ) int correct 0 for ( const auto record data ) if ( naiveBayesPredict ( record , probabilities, classPriors ) record classLabel ) correct accuracy static cast ( correct ) data size ( ) void crossValidate ( const std vector records, double lambda, double averageAccuracy, double stdDev, std vector foldAccuracies ) size t foldSize records size ( ) 1 0 foldAccuracies clear ( ) for ( int i 0 i 1 0 i ) std vector train, test for ( size t j 0 j records size ( ) j ) if ( j i foldSize j ( i 1 ) foldSize ) test push back ( records j ) else train push back ( records j ) double probabilities MAX CLASS MAX COLS 1 3 double classPriors MAX CLASS calculateProbabilities ( 
train , probabilities, classPriors, lambda ) double foldAccuracy evaluateModel ( test , probabilities, classPriors, foldAccuracy ) foldAccuracies push back ( foldAccuracy ) double sum 0 0 for ( size t i 0 i foldAccuracies size ( ) i ) sum foldAccuracies i double mean sum foldAccuracies size ( ) double sqSum 0 0 for ( size t i 0 i foldAccuracies size ( ) i ) sqSum ( foldAccuracies i mean ) ( foldAccuracies i mean ) stdDev std sqrt ( sqSum foldAccuracies size ( ) ) averageAccuracy mean Optimize this C code for Naive Bayes Classification of republicans and democrats dataset Can you make it more understandable and clear, and to be connected In this particular code is implemented naive bayes with Laplas and logarithm for handling the unexpected errors and deviations

The Answer is in the image, click to view ...

Question: void calculateProbabilities ( const std::vector& train, double probabilities [ MAX _ CLASS ] [ MAX _ COLS - 1 ] [ 3 ] , double

void calculateProbabilities

(

const std::vector& train, double probabilities

[

MAX

_

CLASS

] [

MAX

_

COLS

- 1] [3],

double classPriors

[

MAX

_

CLASS

],

double lambda

) {

int classCounts

[

MAX

_

CLASS

] = {0}

;

for

(

int c

= 0

; c

<

MAX

_

CLASS;

+ +

) {

for

(

int i

= 0

; i

<

MAX

_

COLS

- 1

;

+ +

) {

for

(

int v

= 0

; v

< 3

;

+ +

) {

probabilities

[

] [

] [

] =

lambda;

}

}

}

for

(

const auto& record : train

) {

classCounts

[

record

.

classLabel

] + +

;

for

(

size

_

t i

= 0

; i

<

record.attributes.size

()

;

+ +

) {

(

record

.

attributes

[

]! =

MISSING

) {

probabilities

[

record

.

classLabel

] [

] [

record

.

attributes

[

]] + +

;

}

}

}

for

(

int c

= 0

; c

<

MAX

_

CLASS;

+ +

) {

classPriors

[

] =

static

_

cast

(

classCounts

[

]) /

train.size

()

;

for

(

int i

= 0

; i

<

MAX

_

COLS

- 1

;

+ +

) {

double total

=

classCounts

[

] + 3 *

lambda;

for

(

int v

= 0

; v

< 3

;

+ +

) {

probabilities

[

] [

] [

] / =

total;

}

}

}

}

/// @brief Predicts the class of a record from log-space Naive Bayes scores.
///
/// The score of class c is `log(classPriors[c])` plus the sum of
/// `log(probabilities[c][i][value_i])` over every attribute i that is not
/// MISSING. Working in log space avoids the underflow that multiplying many
/// small probabilities would cause.
///
/// @param record         Record to classify; only `attributes` is read.
/// @param probabilities  Likelihood table indexed as [class][attribute][value].
/// @param classPriors    Prior probability of each class.
/// @return DEMOCRAT when its score is strictly greater than REPUBLICAN's,
///         otherwise REPUBLICAN (ties go to REPUBLICAN).
///
/// @note Assumes attribute values convert to integers in [0, 3) - TODO confirm
///       against the Record definition. Out-of-range values and attributes
///       beyond the table width are skipped instead of read out of bounds.
ClassLabel naiveBayesPredict(const Record& record,
                             const double probabilities[MAX_CLASS][MAX_COLS - 1][3],
                             const double classPriors[MAX_CLASS]) {
    constexpr int kNumValues = 3;  // must match the last array dimension
    constexpr std::size_t kNumAttributes = static_cast<std::size_t>(MAX_COLS - 1);

    // Initialise per index, so correctness does not depend on the numeric
    // order in which DEMOCRAT and REPUBLICAN are declared.
    double logProbs[MAX_CLASS];
    for (int c = 0; c < MAX_CLASS; ++c) {
        logProbs[c] = std::log(classPriors[c]);
    }

    const std::size_t usable = record.attributes.size() < kNumAttributes
                                   ? record.attributes.size()
                                   : kNumAttributes;
    for (std::size_t i = 0; i < usable; ++i) {
        if (record.attributes[i] == MISSING) {
            continue;  // missing answers contribute no evidence
        }
        const int value = static_cast<int>(record.attributes[i]);
        if (value < 0 || value >= kNumValues) {
            continue;
        }
        for (int c = 0; c < MAX_CLASS; ++c) {
            logProbs[c] += std::log(probabilities[c][i][value]);
        }
    }

    if (logProbs[DEMOCRAT] > logProbs[REPUBLICAN]) {
        return DEMOCRAT;
    }
    return REPUBLICAN;
}

void evaluateModel

(

const std::vector& data, const double probabilities

[

MAX

_

CLASS

] [

MAX

_

COLS

- 1] [3],

const double classPriors

[

MAX

_

CLASS

],

double& accuracy

) {

int correct

= 0

;

for

(

const auto& record : data

) {

(

naiveBayesPredict

(

record

,

probabilities, classPriors

) = =

record.classLabel

) {

correct

+ +

;

}

}

accuracy

=

static

_

cast

(

correct

) /

data.size

()

;

}

void crossValidate

(

const std::vector& records, double lambda, double& averageAccuracy, double& stdDev, std::vector& foldAccuracies

) {

size

_

t foldSize

=

records.size

() / 10

;

foldAccuracies.clear

()

;

for

(

int i

= 0

; i

< 10

;

+ +

) {

std::vector train, test;

for

(

size

_

t j

= 0

; j

<

records.size

()

;

+ +

) {

(

> =

*

foldSize && j

< (

+ 1) *

foldSize

) {

test.push

_

back

(

records

[

])

;

}

else

{

train.push

_

back

(

records

[

])

;

}

}

double probabilities

[

MAX

_

CLASS

] [

MAX

_

COLS

- 1] [3] = {}

;

double classPriors

[

MAX

_

CLASS

] = {}

;

calculateProbabilities

(

train

,

probabilities, classPriors, lambda

)

;

double foldAccuracy;

evaluateModel

(

test

,

probabilities, classPriors, foldAccuracy

)

;

foldAccuracies.push

_

back

(

foldAccuracy

)

;

}

double sum

= 0.0

;

for

(

size

_

t i

= 0

; i

<

foldAccuracies.size

()

;

+ +

) {

sum

+ =

foldAccuracies

[

]

;

}

double mean

=

sum

/

foldAccuracies.size

()

;

double sqSum

= 0.0

;

for

(

size

_

t i

= 0

; i

<

foldAccuracies.size

()

;

+ +

) {

sqSum

+ = (

foldAccuracies

[

] -

mean

) * (

foldAccuracies

[

] -

mean

)

;

}

stdDev

=

std::sqrt

(

sqSum

/

foldAccuracies.size

())

;

averageAccuracy

=

mean;

}

Optimize this C++ code for Naive Bayes classification of the Republicans and Democrats dataset. Can you make it clearer, easier to understand, and better connected? This code implements Naive Bayes with Laplace smoothing and logarithms (log-probabilities) to handle unexpected errors and deviations.

Step by Step Solution

There are 3 Steps involved in it

1 Expert Approved Answer

Step: 1 Unlock blur-text-image

Question Has Been Solved by an Expert!

Get step-by-step solutions from verified subject matter experts

Step: 2 Unlock

Step: 3 Unlock

Students Have Also Explored These Related Programming Questions!

2.1 Bond class, fair value, duration & yield Let us write a "bond class" to perform various calculations relevant for bonds. A real bond class has a lot of data and class methods. We shall write a...

on c++ microsoft visual studio Scenario/Summary We have two separate goals this week: We are going to create an abstract Employee class and two pure virtual functions - calculatePay() and...

Scenario/Summary [THIS IS C++ LANGUAGE] We have two separate goals this week: We are going to create an abstract Employee class and two pure virtual functions - calculatePay() and displayEmployee()....

Code in C++ Question class Create a class for a question. 1 Question -text: string +setText(string): void +getText() const: string +display() const: void +Question +Question(string)...

I need help with this C++ homework. I just need it done in 1 file: Quiz.h which is derived from a class NAquestion and base class Question. so I will post these as well. I don't need the main.cpp....

In C++ Please. This program will have you implement in histogram.cpp a class whose interface is given in histogram.h, and you will write a driver program for it in main.cpp. The Histogram class...

Given the following program: #include #include using namespace std; struct point_t{ double x_coord, y_coord; }; class Point{ public: Point(); void set_point_data (double, double); double...

Please do this in c++ Parts A and B are required. Part C is optional and is worth 2 points extra credit (but must be submitted in addition to Part A and Part B). Make sure you have read and...

{{C++ , COMPLETE MAIN.CPP} DO NOT USE sanjeev2552's CODE AS THE ANSWER, IT IS WRONG}: Part A ( required ) - The Subset Sum Problem For Ints Create a simple main() and complete other needed globe...

Accounting In the capital projects fund, a $10 million par value bond was sold at 101. The premium is transferred to the debt service fund. Create the journal entries for both the capital projects...

Suppose that there are two firms in the market facing the market demand curve Q = 150 - P and with no costs of production. They produce identical products. 1 a) Suppose the two firms need to choose...

The FASB is responsible for all of the following except: Question 3 Answer a . communicating GAAP through the Codification b . setting accounting standards for US companies c . soliciting input from...

2 (10 points) EcoFresca (EF) has recently introduced a quantity-discount pricing strategy for the purchase of bottled water units from AquaPurify. For orders up to 15,000 units, AquaPurify ch