\documentclass[11pt,twoside]{article}\makeatletter

\IfFileExists{xcolor.sty}%
  {\RequirePackage{xcolor}}%
  {\RequirePackage{color}}
\usepackage{colortbl}
\usepackage{wrapfig}
\usepackage{ifxetex}
\ifxetex
  \usepackage{fontspec}
  \usepackage{xunicode}
  \catcode`⃥=\active \def⃥{\textbackslash}
  \catcode`❴=\active \def❴{\{}
  \catcode`❵=\active \def❵{\}}
  \def\textJapanese{\fontspec{Noto Sans CJK JP}}
  \def\textChinese{\fontspec{Noto Sans CJK SC}}
  \def\textKorean{\fontspec{Noto Sans CJK KR}}
  \setmonofont{DejaVu Sans Mono}
  
\else
  \IfFileExists{utf8x.def}%
   {\usepackage[utf8x]{inputenc}
      \PrerenderUnicode{–}
    }%
   {\usepackage[utf8]{inputenc}}
  \usepackage[english]{babel}
  \usepackage[T1]{fontenc}
  \usepackage{float}
  \usepackage[]{ucs}
  \uc@dclc{8421}{default}{\textbackslash }
  \uc@dclc{10100}{default}{\{}
  \uc@dclc{10101}{default}{\}}
  \uc@dclc{8491}{default}{\AA{}}
  \uc@dclc{8239}{default}{\,}
  \uc@dclc{20154}{default}{ }
  \uc@dclc{10148}{default}{>}
  \def\textschwa{\rotatebox{-90}{e}}
  \def\textJapanese{}
  \def\textChinese{}
  \IfFileExists{tipa.sty}{\usepackage{tipa}}{}
\fi
\def\exampleFont{\ttfamily\small}
\DeclareTextSymbol{\textpi}{OML}{25}
\usepackage{relsize}
\RequirePackage{array}
\def\@testpach{\@chclass
 \ifnum \@lastchclass=6 \@ne \@chnum \@ne \else
  \ifnum \@lastchclass=7 5 \else
   \ifnum \@lastchclass=8 \tw@ \else
    \ifnum \@lastchclass=9 \thr@@
   \else \z@
   \ifnum \@lastchclass = 10 \else
   \edef\@nextchar{\expandafter\string\@nextchar}%
   \@chnum
   \if \@nextchar c\z@ \else
    \if \@nextchar l\@ne \else
     \if \@nextchar r\tw@ \else
   \z@ \@chclass
   \if\@nextchar |\@ne \else
    \if \@nextchar !6 \else
     \if \@nextchar @7 \else
      \if \@nextchar (8 \else
       \if \@nextchar )9 \else
  10
  \@chnum
  \if \@nextchar m\thr@@\else
   \if \@nextchar p4 \else
    \if \@nextchar b5 \else
   \z@ \@chclass \z@ \@preamerr \z@ \fi \fi \fi \fi
   \fi \fi  \fi  \fi  \fi  \fi  \fi \fi \fi \fi \fi \fi}
\gdef\arraybackslash{\let\\=\@arraycr}
\def\@textsubscript#1{{\m@th\ensuremath{_{\mbox{\fontsize\sf@size\z@#1}}}}}
\def\Panel#1#2#3#4{\multicolumn{#3}{){\columncolor{#2}}#4}{#1}}
\def\abbr{}
\def\corr{}
\def\expan{}
\def\gap{}
\def\orig{}
\def\reg{}
\def\ref{}
\def\sic{}
\def\persName{}\def\name{}
\def\placeName{}
\def\orgName{}
\def\textcal#1{{\fontspec{Lucida Calligraphy}#1}}
\def\textgothic#1{{\fontspec{Lucida Blackletter}#1}}
\def\textlarge#1{{\large #1}}
\def\textoverbar#1{\ensuremath{\overline{#1}}}
\def\textquoted#1{‘#1’}
\def\textsmall#1{{\small #1}}
\def\textsubscript#1{\@textsubscript{\selectfont#1}}
\def\textxi{\ensuremath{\xi}}
\def\titlem{\itshape}
\newenvironment{biblfree}{}{\ifvmode\par\fi }
\newenvironment{bibl}{}{}
\newenvironment{byline}{\vskip6pt\itshape\fontsize{16pt}{18pt}\selectfont}{\par }
\newenvironment{citbibl}{}{\ifvmode\par\fi }
\newenvironment{docAuthor}{\ifvmode\vskip4pt\fontsize{16pt}{18pt}\selectfont\fi\itshape}{\ifvmode\par\fi }
\newenvironment{docDate}{}{\ifvmode\par\fi }
\newenvironment{docImprint}{\vskip 6pt}{\ifvmode\par\fi }
\newenvironment{docTitle}{\vskip6pt\bfseries\fontsize{22pt}{25pt}\selectfont}{\par }
\newenvironment{msHead}{\vskip 6pt}{\par}
\newenvironment{msItem}{\vskip 6pt}{\par}
\newenvironment{rubric}{}{}
\newenvironment{titlePart}{}{\par }

\newcolumntype{L}[1]{){\raggedright\arraybackslash}p{#1}}
\newcolumntype{C}[1]{){\centering\arraybackslash}p{#1}}
\newcolumntype{R}[1]{){\raggedleft\arraybackslash}p{#1}}
\newcolumntype{P}[1]{){\arraybackslash}p{#1}}
\newcolumntype{B}[1]{){\arraybackslash}b{#1}}
\newcolumntype{M}[1]{){\arraybackslash}m{#1}}
\definecolor{label}{gray}{0.75}
\def\unusedattribute#1{\sout{\textcolor{label}{#1}}}
\DeclareRobustCommand*{\xref}{\hyper@normalise\xref@}
\def\xref@#1#2{\hyper@linkurl{#2}{#1}}
\begingroup
\catcode`\_=\active
\gdef_#1{\ensuremath{\sb{\mathrm{#1}}}}
\endgroup
\mathcode`\_=\string"8000
\catcode`\_=12\relax

\usepackage[a4paper,twoside,lmargin=1in,rmargin=1in,tmargin=1in,bmargin=1in,marginparwidth=0.75in]{geometry}
\usepackage{framed}

\definecolor{shadecolor}{gray}{0.95}
\usepackage{longtable}
\usepackage[normalem]{ulem}
\usepackage{fancyvrb}
\usepackage{fancyhdr}
\usepackage{graphicx}
\usepackage{marginnote}

\renewcommand{\@cite}[1]{#1}


\renewcommand*{\marginfont}{\itshape\footnotesize}

\def\Gin@extensions{.pdf,.png,.jpg,.mps,.tif}

  \pagestyle{fancy}

\usepackage[pdftitle={Data Mining Approach to Prediction of Going Concern using Classification and Regression Tree (CART)},
 pdfauthor={}]{hyperref}
\hyperbaseurl{}

	 \paperwidth210mm
	 \paperheight297mm
              
\def\@pnumwidth{1.55em}
\def\@tocrmarg {2.55em}
\def\@dotsep{4.5}
\setcounter{tocdepth}{3}
\clubpenalty=8000
\emergencystretch 3em
\hbadness=4000
\hyphenpenalty=400
\pretolerance=750
\tolerance=2000
\vbadness=4000
\widowpenalty=10000

\renewcommand\section{\@startsection {section}{1}{\z@}%
     {-1.75ex \@plus -0.5ex \@minus -.2ex}%
     {0.5ex \@plus .2ex}%
     {\reset@font\Large\bfseries}}
\renewcommand\subsection{\@startsection{subsection}{2}{\z@}%
     {-1.75ex\@plus -0.5ex \@minus- .2ex}%
     {0.5ex \@plus .2ex}%
     {\reset@font\Large}}
\renewcommand\subsubsection{\@startsection{subsubsection}{3}{\z@}%
     {-1.5ex\@plus -0.35ex \@minus -.2ex}%
     {0.5ex \@plus .2ex}%
     {\reset@font\large}}
\renewcommand\paragraph{\@startsection{paragraph}{4}{\z@}%
     {-1ex \@plus-0.35ex \@minus -0.2ex}%
     {0.5ex \@plus .2ex}%
     {\reset@font\normalsize}}
\renewcommand\subparagraph{\@startsection{subparagraph}{5}{\parindent}%
     {1.5ex \@plus1ex \@minus .2ex}%
     {-1em}%
     {\reset@font\normalsize\bfseries}}


\def\l@section#1#2{\addpenalty{\@secpenalty} \addvspace{1.0em plus 1pt}
 \@tempdima 1.5em \begingroup
 \parindent \z@ \rightskip \@pnumwidth 
 \parfillskip -\@pnumwidth 
 \bfseries \leavevmode #1\hfil \hbox to\@pnumwidth{\hss #2}\par
 \endgroup}
\def\l@subsection{\@dottedtocline{2}{1.5em}{2.3em}}
\def\l@subsubsection{\@dottedtocline{3}{3.8em}{3.2em}}
\def\l@paragraph{\@dottedtocline{4}{7.0em}{4.1em}}
\def\l@subparagraph{\@dottedtocline{5}{10em}{5em}}
\@ifundefined{c@section}{\newcounter{section}}{}
\@ifundefined{c@chapter}{\newcounter{chapter}}{}
\newif\if@mainmatter 
\@mainmattertrue
\def\chaptername{Chapter}
\def\frontmatter{%
  \pagenumbering{roman}
  \def\thechapter{\@roman\c@chapter}
  \def\theHchapter{\roman{chapter}}
  \def\thesection{\@roman\c@section}
  \def\theHsection{\roman{section}}
  \def\@chapapp{}%
}
\def\mainmatter{%
  \cleardoublepage
  \def\thechapter{\@arabic\c@chapter}
  \setcounter{chapter}{0}
  \setcounter{section}{0}
  \pagenumbering{arabic}
  \setcounter{secnumdepth}{6}
  \def\@chapapp{\chaptername}%
  \def\theHchapter{\arabic{chapter}}
  \def\thesection{\@arabic\c@section}
  \def\theHsection{\arabic{section}}
}
\def\backmatter{%
  \cleardoublepage
  \setcounter{chapter}{0}
  \setcounter{section}{0}
  \setcounter{secnumdepth}{2}
  \def\@chapapp{\appendixname}%
  \def\thechapter{\@Alph\c@chapter}
  \def\theHchapter{\Alph{chapter}}
  \appendix
}
\newenvironment{bibitemlist}[1]{%
   \list{\@biblabel{\@arabic\c@enumiv}}%
       {\settowidth\labelwidth{\@biblabel{#1}}%
        \leftmargin\labelwidth
        \advance\leftmargin\labelsep
        \@openbib@code
        \usecounter{enumiv}%
        \let\p@enumiv\@empty
        \renewcommand\theenumiv{\@arabic\c@enumiv}%
	}%
  \sloppy
  \clubpenalty4000
  \@clubpenalty \clubpenalty
  \widowpenalty4000%
  \sfcode`\.\@m}%
  {\def\@noitemerr
    {\@latex@warning{Empty `bibitemlist' environment}}%
    \endlist}

\def\tableofcontents{\section*{\contentsname}\@starttoc{toc}}
\parskip0pt
\parindent1em
% \Panel is already defined byte-for-byte identically earlier in the
% preamble (generated stylesheet emitted it twice); the redundant
% duplicate redefinition has been removed.
\newenvironment{reflist}{%
  \begin{raggedright}\begin{list}{}
  {%
   \setlength{\topsep}{0pt}%
   \setlength{\rightmargin}{0.25in}%
   \setlength{\itemsep}{0pt}%
   \setlength{\itemindent}{0pt}%
   \setlength{\parskip}{0pt}%
   \setlength{\parsep}{2pt}%
   \def\makelabel##1{\itshape ##1}}%
  }
  {\end{list}\end{raggedright}}
\newenvironment{sansreflist}{%
  \begin{raggedright}\begin{list}{}
  {%
   \setlength{\topsep}{0pt}%
   \setlength{\rightmargin}{0.25in}%
   \setlength{\itemindent}{0pt}%
   \setlength{\parskip}{0pt}%
   \setlength{\itemsep}{0pt}%
   \setlength{\parsep}{2pt}%
   \def\makelabel##1{\upshape ##1}}%
  }
  {\end{list}\end{raggedright}}
\newenvironment{specHead}[2]%
 {\vspace{20pt}\hrule\vspace{10pt}%
  \phantomsection\label{#1}\markright{#2}%

  \pdfbookmark[2]{#2}{#1}%
  \hspace{-0.75in}{\bfseries\fontsize{16pt}{18pt}\selectfont#2}%
  }{}
      \def\TheFullDate{2013-01-15 (revised: 15 January 2013)}
\def\TheID{\makeatother }
\def\TheDate{2013-01-15}
\title{Data Mining Approach to Prediction of Going Concern using Classification and Regression Tree (CART)}
\author{}\makeatletter 
\makeatletter
\newcommand*{\cleartoleftpage}{%
  \clearpage
    \if@twoside
    \ifodd\c@page
      \hbox{}\newpage
      \if@twocolumn
        \hbox{}\newpage
      \fi
    \fi
  \fi
}
\makeatother
\makeatletter
\thispagestyle{empty}
\markright{\@title}\markboth{\@title}{\@author}
\renewcommand\small{\@setfontsize\small{9pt}{11pt}\abovedisplayskip 8.5\p@ plus3\p@ minus4\p@
\belowdisplayskip \abovedisplayskip
\abovedisplayshortskip \z@ plus2\p@
\belowdisplayshortskip 4\p@ plus2\p@ minus2\p@
\def\@listi{\leftmargin\leftmargini
               \topsep 2\p@ plus1\p@ minus1\p@
               \parsep 2\p@ plus\p@ minus\p@
               \itemsep 1pt}
}
\makeatother
\fvset{frame=single,numberblanklines=false,xleftmargin=5mm,xrightmargin=5mm}
\fancyhf{} 
\setlength{\headheight}{14pt}
\fancyhead[LE]{\bfseries\leftmark} 
\fancyhead[RO]{\bfseries\rightmark} 
\fancyfoot[RO]{}
\fancyfoot[CO]{\thepage}
\fancyfoot[LO]{\TheID}
\fancyfoot[LE]{}
\fancyfoot[CE]{\thepage}
\fancyfoot[RE]{\TheID}
\hypersetup{citebordercolor=0.75 0.75 0.75,linkbordercolor=0.75 0.75 0.75,urlbordercolor=0.75 0.75 0.75,bookmarksnumbered=true}
\fancypagestyle{plain}{\fancyhead{}\renewcommand{\headrulewidth}{0pt}}

\date{}
\usepackage{authblk}

\providecommand{\keywords}[1]
{
\footnotesize
  \textbf{\textit{Index terms---}} #1
}

\usepackage{graphicx,xcolor}
\definecolor{GJBlue}{HTML}{273B81}
\definecolor{GJLightBlue}{HTML}{0A9DD9}
\definecolor{GJMediumGrey}{HTML}{6D6E70}
\definecolor{GJLightGrey}{HTML}{929497} 

\renewenvironment{abstract}{%
   \setlength{\parindent}{0pt}\raggedright
   \textcolor{GJMediumGrey}{\rule{\textwidth}{2pt}}
   \vskip16pt
   \textcolor{GJBlue}{\large\bfseries\abstractname\space}
}{%   
   \vskip8pt
   \textcolor{GJMediumGrey}{\rule{\textwidth}{2pt}}
   \vskip16pt
}

\usepackage[absolute,overlay]{textpos}

\makeatother 
      \usepackage{lineno}
      \linenumbers
      
\begin{document}

             \author[1]{Dr. Mahdi  Salehi}

             \author[2]{Dr. Mahdi  Salehi}

             \affil[1]{  Ferdowsi University of Mashhad}

\renewcommand\Authands{ and }

\date{\small \em Received: 10 December 2012 Accepted: 2 January 2013 Published: 15 January 2013}

\maketitle


\begin{abstract}
        


This paper has employed a data mining approach for Going Concern Prediction (GCP) for one year ahead and has applied Classification and Regression Tree (CART) and Naïve Bayes Bayesian Network (NBBN), based on a feature selection method, to Iranian firms listed on the Tehran Stock Exchange (TSE). For this purpose, in the first step, Stepwise Discriminant Analysis (SDA) was used to select the final variables from among 42 candidate variables, and in the next stage, 10-fold cross-validation was applied to identify the optimal model. The McNemar test signifies that there is a significant difference between the two models in terms of prediction accuracy, and the CART model is able to predict going concern more accurately. The CART model reached 99.92 and 98.62 percent accuracy rates for the holdout and training data, respectively.

\end{abstract}


\keywords{data mining, going concern prediction, classification and regression tree, naïve bayes bayesian network, financial ratios, Iran.}

\begin{textblock*}{18cm}(1cm,1cm) % {block width} (coords) 
\textcolor{GJBlue}{\LARGE Global Journals \LaTeX\ JournalKaleidoscope\texttrademark}
\end{textblock*}

\begin{textblock*}{18cm}(1.4cm,1.5cm) % {block width} (coords) 
\textcolor{GJBlue}{\footnotesize \\ Artificial Intelligence formulated this projection for compatibility purposes from the original article published at Global Journals. However, this technology is currently in beta. \emph{Therefore, kindly ignore odd layouts, missed formulae, text, tables, or figures.}}
\end{textblock*}


\let\tabcellsep& 	 	 		 
\section[{Introduction}]{Introduction}\par
Going Concern Prediction (GCP) is an important element in investors' decision-making. Rapid advances in technology, vast environmental changes and increasing competition have affected the security of investment. On the other hand, based on the requirements of Statement on Auditing Standards (SAS) No.~59, on every audit the auditor should evaluate whether substantial doubt exists about the firm's ability to continue as a going concern  {\ref (AICPA, 1988)}. However, SAS 59 contained guidelines that were criticized as deeply subjective, general and ambiguous \hyperref[b7]{(Koh \& Killough, 1988)} and, consequently, assessment of GCP sometimes is a tough process; the complexity of GCP has led to the development of several models employing multiple financial and non-financial variables that might signal a going concern opinion for the auditor \hyperref[b11]{(Martens et al, 2008)}. Early studies of GCP were developed by applying statistical techniques such as multiple discriminant analysis, logit and probit \hyperref[b12]{(McKee, 1976;}\hyperref[b4]{Kida, 1980;}\hyperref[b5]{Koh, 1987;}\hyperref[b13]{Menon \& Schwartz, 1987;}\hyperref[b6]{Koh \& Brown, 1991)}. In recent years, data mining has been established and developed, and has begun to appear and grow rapidly in the financial area, constructing a new approach for deep research. Data mining techniques, by utilizing a large amount of financial data, can extract valuable and unknown knowledge dynamically. Using data mining techniques, several studies have been conducted in the GCP area and the findings indicate that these techniques are able to predict the going concern status of firms and that accounting data are useful in GCP \hyperref[b2]{(Brabazon \& Keenan, 2004;}\hyperref[b8]{Koh \& Kee Low, 2004;}\hyperref[b11]{Martens et al, 2008;}\hyperref[b14]{Mokhatab et al., 2011)}. 
Nowadays these methods because of the restrictive assumptions of statistical techniques (such as normality, linearity and independence of variables) are used less. This research has applied Classification and Regression Tree (CART) and Naïve Bayes Bayesian Network for GCP. Results from this study will help a manager to keep track of company's performance and to identify significant problems and take efficient measure to reduce the coincidence of failure. In addition, this model helps lenders and other stakeholders to have a clear and comprehensive picture of the firm's prospective status. In addition, auditor can use the survey results in the final stages of the audit engagement as a qualitycontrol device or as a benchmark in auditor judgment. Particularly, the GCP model in this paper can be applied for auditors to assess potential clients and as a means to identify non-going concern firms that might require further consideration. 
\section[{II.}]{II.} 
\section[{Research Development}]{Research Development}\par
The data set is composed of 146 Iranian manufacturing companies, comprising 73 matched pairs of bankrupt firms and firms with going concern status, all of which were or still are listed on the Tehran Stock Exchange (TSE) from 2001--2011. As can be seen in Table \hyperref[tab_0]{1}, the 42 proposed variables used in this study are shown. After data collection, this paper applied a process of feature selection by t-test and Stepwise Discriminant Analysis (SDA) at a significance level of 0.05 and selected the final variables. The potential advantages of feature selection are facilitating data visualization and understandable data, and reducing the measurement and storage requirements \hyperref[b1]{(Ashoori \& Mohammadi, 2011)}. Another purpose of these tests is to determine the financial ratios that can distinguish between the two groups of companies (going concern and non-going concern status). The result of the SDA process is shown in Table \hyperref[tab_1]{2}. The ratios that are entered in the model are total liabilities to total assets ($X_{9}$), retained earnings to total assets ($X_{31}$), operational income to sales ($X_{36}$) and net income to total assets ($X_{34}$). After extraction of the financial ratios, a model was constructed that is explained as a discriminant model below: $Z = -0.374X_{9} + 0.293X_{31} + 0.359X_{36} + 0.384X_{34}$\par
CART methodology was popularized in the 1980s by \hyperref[b3]{Breiman et al. (1984)}. In the area of GCP, the goal of the analysis via CART is to obtain a set of if-then rules with acceptable accuracy that determine which companies will have going concern status in the future. Furthermore, the reasons for selecting CART are that it is nonparametric and can easily handle outliers. It is flexible and has an ability to adjust in time  {\ref (Timofeev 2004)}. In order to obtain the best predictive accuracy, CART is built to minimize the misclassification cost, which takes both variance and misclassification rates into consideration. It is a significant step to choose the splits on the features that are employed to predict membership in the corresponding class of firms. CART computational detail includes finding the best split rules in order to make an uncomplicated, informative and accurate tree. CART regards all variables as independent in the calculations of splits with the training data set. The $i$th sample is expressed as $(x_{i1}, x_{i2}, \ldots, x_{ij}, \ldots, y_{i})$, where $x_{ij}$ is the value of the $i$th sample firm on the $j$th feature and the label value of the sample is $y_{i}$. Since CART is a binary recursive partitioning method in which every leaf of the data splits into two sub-leaves, for a classification problem the values of $y_{i}$ are binary, e.g., $-1$ or $1$. In the process of splitting, if a condition on a feature value such as $x_{ij} \le c$ is met, CART follows the rule that a sample goes right; otherwise it goes left. A split at each node will occur only when the split leads to the greatest improvement in accuracy of prediction. As a specific type of node impurity measure, \hyperref[b3]{Breiman et al. (1984)} proposed applying the Gini index as the criterion used to reduce the impurity in splitting for classification, since it can be estimated more rapidly and be readily extended to include symmetric costs. 
In the classification problem of GCP, the Gini index of impurity of a node can be signified as follows \hyperref[b3]{(Breiman et al., 1984)}: $I_{gini}(c) = 1 - \sum_{j} p(c_{j})^{2}$\par
Where $p(c_{j})$ indicates the relative frequency of class $c_{j}$ in the node. The Gini index reaches a value of zero when only one class is obtained at a node. It means that if all cases in a node belong to the same class, the Gini index will be zero \hyperref[b9]{(Li, Sun \& Wu, 2010)}. CART applies backward pruning algorithms. Pruning is necessary to build smaller tree models that perform better on new data and not just on the training data. CART uses pruning and selecting at each node in the tree when the tree is fit \hyperref[b15]{(Soni, 2010)}. Once the classification or regression tree is constructed, it can be used for classification of new data. The output of this stage is an assigned class or response value for each of the new observations. Through the set of questions in the tree, each of the new observations will get to one of the terminal nodes of the tree. A new observation is assigned the dominating class/response value of the terminal node it reaches.\par b) The Method of Naïve Bayes Bayesian Network (NBBN)\par
Bayes networks are a powerful tool for modelling relationships between a set of variables and they are a suitable tool for dealing with uncertainty conditions in expert systems \hyperref[b10]{(Markov, 2007)}. The purpose of a Bayes network is to establish a model that can classify companies correctly using financial ratios. A NBBN is based on Bayes' rule, which is expressed as follows: $P(A/B) = \frac{P(B/A)\,P(A)}{P(B)}$ \textbf{(2)}. In problem solving of going concern, $P(A)$\par
shows the percentage of companies with going concern status, $P(B)$ indicates the share of each of the independent variables used for GCP, and $P(A/B)$ is the probability of going concern status during one year ahead. An example of a NBBN can be seen in Figure \hyperref[fig_1]{1}. In this figure, $A$ is the dependent variable and $B_{1}$, $B_{2}$, $B_{3}$, and $B_{4}$ are independent variables \hyperref[b16]{(Sun \& Shenoy, 2007)}.  
\section[{Experimental Results}]{Experimental Results}\par
The proposed CART and NBBN models are implemented by using MATLAB 7.6. The results from the 10 testing data sets are obtained by using 10-fold cross-validation (see Table \hyperref[tab_2]{3}). As shown in Table \hyperref[tab_4]{5}, the result of the McNemar test at the 5\% level indicates that there are significant differences between the two models in GCP. According to Table \hyperref[tab_5]{6}, Type I error is the probability that a company with non-going concern status is classified as a company with going concern status, and Type II error is the probability that a company with going concern status is classified as a company with non-going concern status.\par
Costs related to these two types of errors are very different. Costs resulting from incorrectly classifying a company with non-going concern as a company with going concern status (Type I error) is much larger than the Type II error (incorrectly classifying a company with going concern as a company with non-going concern status). In holdout data type I and II error are also equal to 2.5 and 0 percent in CART model and 22.64 and 22.65 percent for obtained model by NBBN.  
\section[{Conclusion}]{Conclusion}\par
The current study demonstrated the feasibility of applying CART and NBBN to predict going concern status with data collected from Iran. This paper considered a set of features that includes 42 variables proposed in prior literature dealing with financial status prediction models in Iran and applied SDA to identify potential variables for the GCP model; finally, four financial ratios were selected, and CART and NBBN GCP models were constructed based on the selected features. Based on the conclusions, the empirical tests show that the CART and NBBN models have achieved 98.62 and 75.55 percent accuracy rates for training and holdout data, respectively. Moreover, McNemar's test results indicate that there are significant differences between the two models in predicting going concern. In summary, the results obtained from this research on 146 companies of Iran signify that the CART model has an appropriate ability for GCP of firms. Further, this research empirically tested feature selection using a statistical technique, and data mining algorithms can be used for future research.\begin{figure}[htbp]
\noindent\textbf{}\includegraphics[]{image-2.png}
\caption{\label{fig_0}D}\end{figure}
 \begin{figure}[htbp]
\noindent\textbf{1}\includegraphics[]{image-3.png}
\caption{\label{fig_1}Figure 1 :}\end{figure}
 \begin{figure}[htbp]
\noindent\textbf{1} \par 
\begin{longtable}{P{0.85\textwidth}}
2013\\
Year\\
Volume XIII Issue III Version I\\
( )\\
Global Journal of Management and Business Research\end{longtable} \par
  {\small\itshape [Note: Data Mining Approach to Prediction of Going Concern using Classification and Regression Tree (CART)]} 
\caption{\label{tab_0}Table 1 :}\end{figure}
 \begin{figure}[htbp]
\noindent\textbf{2} \par 
\begin{longtable}{P{0.16194556451612901\textwidth}P{0.06426411290322581\textwidth}P{0.12424395161290323\textwidth}P{0.04327116935483871\textwidth}P{0.04412802419354839\textwidth}P{0.05483870967741935\textwidth}P{0.07925907258064516\textwidth}P{0.1349546370967742\textwidth}P{0.05912298387096773\textwidth}P{0.04412802419354839\textwidth}P{0.03984375\textwidth}}
\#\tabcellsep \multicolumn{2}{l}{Definition of variables}\tabcellsep Means of Group 1\tabcellsep Means of Group 0\tabcellsep Sig level\tabcellsep \#\tabcellsep Definition of variables\tabcellsep Means of Group 1\tabcellsep Means of Group 0\tabcellsep Sig level\\
1\tabcellsep EBIT/TA\tabcellsep \tabcellsep 0.18\tabcellsep 0.05\tabcellsep 0.00\tabcellsep 2\tabcellsep LTD/SE\tabcellsep 0.20\tabcellsep 0.56\tabcellsep 0.06\\
3\tabcellsep RE/SC\tabcellsep \tabcellsep 0.65\tabcellsep 0.02\tabcellsep 0.00\tabcellsep 4\tabcellsep MVE/TL\tabcellsep 1.40\tabcellsep 0.66\tabcellsep 0.00\\
5\tabcellsep MVE/SE\tabcellsep \tabcellsep 2.42\tabcellsep 2.57\tabcellsep 0.22\tabcellsep 6\tabcellsep MVE/TA\tabcellsep 0.77\tabcellsep 0.48\tabcellsep 0.00\\
7\tabcellsep Ca/TA\tabcellsep \tabcellsep 0.05\tabcellsep 0.03\tabcellsep 0.00\tabcellsep 8\tabcellsep Size(logTA)\tabcellsep 5.25\tabcellsep 5.23\tabcellsep 0.83\\
9\tabcellsep TL/TA*\tabcellsep \tabcellsep 0.67\tabcellsep 0.80\tabcellsep 0.00\tabcellsep \multicolumn{2}{l}{10 CL/SE}\tabcellsep 2.27\tabcellsep 4.76\tabcellsep 0.00\\
11\tabcellsep CL/TL\tabcellsep \tabcellsep 0.86\tabcellsep 0.85\tabcellsep 0.94\tabcellsep \multicolumn{2}{l}{12 (Ca+STI)/CL}\tabcellsep 0.11\tabcellsep 0.05\tabcellsep 0.00\\
13\tabcellsep \multicolumn{2}{l}{(R+Inv)/TA}\tabcellsep 0.57\tabcellsep 0.57\tabcellsep 0.88\tabcellsep \multicolumn{2}{l}{14 R/S}\tabcellsep 0.53\tabcellsep 0.40\tabcellsep 0.10\\
15\tabcellsep R/Inv\tabcellsep \tabcellsep 1.18\tabcellsep 1.00\tabcellsep 0.93\tabcellsep \multicolumn{2}{l}{16 SE/TL}\tabcellsep 0.63\tabcellsep 0.32\tabcellsep 0.00\\
17\tabcellsep SE/TA\tabcellsep \tabcellsep 0.35\tabcellsep 0.22\tabcellsep 0.00\tabcellsep \multicolumn{2}{l}{18 CA/CL}\tabcellsep 1.31\tabcellsep 1.07\tabcellsep 0.00\\
19\tabcellsep QA/CL\tabcellsep \tabcellsep 0.70\tabcellsep 0.57\tabcellsep 0.00\tabcellsep \multicolumn{2}{l}{20 QA/TA}\tabcellsep 0.37\tabcellsep 0.36\tabcellsep 0.73\\
21\tabcellsep \multicolumn{2}{l}{FA/(SE+LTD)}\tabcellsep 0.60\tabcellsep 0.91\tabcellsep 0.01\tabcellsep \multicolumn{2}{l}{22 FA/TA}\tabcellsep 0.22\tabcellsep 0.24\tabcellsep 0.63\\
23\tabcellsep CA/TA\tabcellsep \tabcellsep 0.70\tabcellsep 0.68\tabcellsep 0.66\tabcellsep \multicolumn{2}{l}{24 Ca/CL}\tabcellsep 0.09\tabcellsep 0.04\tabcellsep 0.00\\
25\tabcellsep IE/GP\tabcellsep \tabcellsep -0.02\tabcellsep -1.21\tabcellsep 0.48\tabcellsep \multicolumn{2}{l}{26 S/Ca}\tabcellsep 35.30\tabcellsep 44.80\tabcellsep 0.11\\
27\tabcellsep S/TA\tabcellsep \tabcellsep 0.93\tabcellsep 0.70\tabcellsep 0.00\tabcellsep \multicolumn{2}{l}{28 WC/TA}\tabcellsep 0.13\tabcellsep 0.00\tabcellsep 0.00\\
29\tabcellsep PIC/SE\tabcellsep \tabcellsep 0.53\tabcellsep 0.86\tabcellsep 0.00\tabcellsep \multicolumn{2}{l}{30 S/WC}\tabcellsep 2.87\tabcellsep 1.73\tabcellsep 0.96\\
31\tabcellsep RE/TA*\tabcellsep \tabcellsep 0.08\tabcellsep -0.03\tabcellsep 0.00\tabcellsep \multicolumn{2}{l}{32 NI/SE}\tabcellsep 0.42\tabcellsep -0.03\tabcellsep 0.00\\
33\tabcellsep NI/S\tabcellsep \tabcellsep 0.16\tabcellsep -0.02\tabcellsep 0.00\tabcellsep \multicolumn{2}{l}{34 NI/TA*}\tabcellsep 0.13\tabcellsep 0.00\tabcellsep 0.00\\
35\tabcellsep S/CA\tabcellsep \tabcellsep 1.34\tabcellsep 1.07\tabcellsep 0.00\tabcellsep \multicolumn{2}{l}{36 OI/S*}\tabcellsep 0.20\tabcellsep 0.06\tabcellsep 0.00\\
37\tabcellsep OI/TA\tabcellsep \tabcellsep 0.17\tabcellsep 0.03\tabcellsep 0.00\tabcellsep \multicolumn{2}{l}{38 EBIT/IE}\tabcellsep -5.21\tabcellsep -0.45\tabcellsep 0.05\\
39\tabcellsep EBIT/S\tabcellsep \tabcellsep 0.52\tabcellsep 0.10\tabcellsep 0.00\tabcellsep \multicolumn{2}{l}{40 GP/S}\tabcellsep 0.27\tabcellsep 0.15\tabcellsep 0.00\\
41\tabcellsep S/SE\tabcellsep \tabcellsep 3.32\tabcellsep 4.68\tabcellsep 0.05\tabcellsep \multicolumn{2}{l}{42 S/FA}\tabcellsep 6.29\tabcellsep 6.44\tabcellsep 0.33\\
\multicolumn{8}{l}{Group 1: going concern firms and Group 0: non-going concern firms}\tabcellsep \tabcellsep \\
\multicolumn{4}{l}{* : Final variables selected by SDA}\tabcellsep \tabcellsep \tabcellsep \tabcellsep \tabcellsep \tabcellsep \\
\multicolumn{3}{l}{CA: Current assets}\tabcellsep \tabcellsep \tabcellsep \tabcellsep \tabcellsep \multicolumn{2}{l}{NI: Net income}\tabcellsep \\
\multicolumn{2}{l}{Ca: Cash}\tabcellsep \tabcellsep \tabcellsep \tabcellsep \tabcellsep \tabcellsep \multicolumn{3}{l}{OI: Operational income}\\
\multicolumn{3}{l}{CL: Current liabilities}\tabcellsep \tabcellsep \tabcellsep \tabcellsep \tabcellsep \multicolumn{3}{l}{QA: Quick assets}\\
\multicolumn{3}{l}{PIC: Paid in capital}\tabcellsep \tabcellsep \tabcellsep \tabcellsep \tabcellsep \multicolumn{2}{l}{R: Receivables}\tabcellsep \\
\multicolumn{5}{l}{EBIT: Earnings before interest \& taxes}\tabcellsep \tabcellsep \tabcellsep \multicolumn{3}{l}{RE: Retained earnings}\\
\multicolumn{2}{l}{FA: Fixed assets}\tabcellsep \tabcellsep \tabcellsep \tabcellsep \tabcellsep \tabcellsep \multicolumn{2}{l}{S: Sales}\tabcellsep \\
\multicolumn{2}{l}{GP: Gross profit}\tabcellsep \tabcellsep \tabcellsep \tabcellsep \tabcellsep \tabcellsep \multicolumn{3}{l}{SC: Stock capital}\\
\multicolumn{3}{l}{IE: Interest expenses}\tabcellsep \tabcellsep \tabcellsep \tabcellsep \tabcellsep \multicolumn{3}{l}{SE: Shareholders' equity}\\
\multicolumn{2}{l}{Inv: Inventory}\tabcellsep \tabcellsep \tabcellsep \tabcellsep \tabcellsep \tabcellsep \multicolumn{3}{l}{STI: Short term investments}\\
\multicolumn{3}{l}{LA : Liquid assets}\tabcellsep \tabcellsep \tabcellsep \tabcellsep \tabcellsep \multicolumn{2}{l}{TA: Total assets}\tabcellsep \\
\multicolumn{3}{l}{LTD: Long term debt}\tabcellsep \tabcellsep \tabcellsep \tabcellsep \tabcellsep \multicolumn{3}{l}{TL: Total liabilities}\\
\multicolumn{4}{l}{MVE: Marked value of equity}\tabcellsep \tabcellsep \tabcellsep \tabcellsep \multicolumn{3}{l}{WC: Working capital}\\
\tabcellsep Step\tabcellsep \tabcellsep \tabcellsep \tabcellsep \multicolumn{5}{l}{Tolerance F to Remove Wilks' Lambda}\\
\tabcellsep 1\tabcellsep \multicolumn{3}{l}{Net income to total assets}\tabcellsep \tabcellsep 1.00\tabcellsep 100.77\tabcellsep \tabcellsep \\
\tabcellsep 2\tabcellsep \multicolumn{3}{l}{Net income to total assets}\tabcellsep \tabcellsep 0.94\tabcellsep 56.24\tabcellsep \multicolumn{2}{l}{0.75}\\
\tabcellsep \tabcellsep \multicolumn{3}{l}{Total liabilities to total assets}\tabcellsep \tabcellsep 0.94\tabcellsep 9.07\tabcellsep \multicolumn{2}{l}{0.55}\\
\tabcellsep 3\tabcellsep \multicolumn{3}{l}{Net income to total assets}\tabcellsep \tabcellsep 0.51\tabcellsep 8.62\tabcellsep \multicolumn{2}{l}{0.52}\\
\tabcellsep \tabcellsep \multicolumn{3}{l}{Total liabilities to total assets}\tabcellsep \tabcellsep 0.91\tabcellsep 11.10\tabcellsep \multicolumn{2}{l}{0.53}\\
\tabcellsep \tabcellsep \multicolumn{3}{l}{Operational income to sales}\tabcellsep \tabcellsep 0.55\tabcellsep 6.11\tabcellsep \multicolumn{2}{l}{0.51}\\
\tabcellsep 4\tabcellsep \multicolumn{3}{l}{Net income to total assets}\tabcellsep \tabcellsep 0.48\tabcellsep 4.75\tabcellsep \multicolumn{2}{l}{0.49}\\
\tabcellsep \tabcellsep \multicolumn{3}{l}{Total liabilities to total assets}\tabcellsep \tabcellsep 0.90\tabcellsep 8.55\tabcellsep \multicolumn{2}{l}{0.50}\\
\tabcellsep \tabcellsep \multicolumn{3}{l}{Operational income to sales}\tabcellsep \tabcellsep 0.54\tabcellsep 4.57\tabcellsep \multicolumn{2}{l}{0.49}\\
\tabcellsep \tabcellsep \multicolumn{4}{l}{Retained earnings to total assets}\tabcellsep 0.77\tabcellsep 4.37\tabcellsep \multicolumn{2}{l}{0.49}\end{longtable} \par
 
\caption{\label{tab_1}Table 2 :}\end{figure}
 \begin{figure}[htbp]
\noindent\textbf{3} \par 
\begin{longtable}{P{0.07623318385650224\textwidth}P{0.21917040358744397\textwidth}P{0.1867713004484305\textwidth}P{0.20011210762331838\textwidth}P{0.16771300448430493\textwidth}}
\tabcellsep \multicolumn{3}{l}{and NBBN model}\tabcellsep \\
\tabcellsep \multicolumn{2}{l}{CART}\tabcellsep \multicolumn{2}{l}{NBBN}\\
Fold\tabcellsep Training\tabcellsep Hold-out\tabcellsep Training\tabcellsep Hold-out\\
\tabcellsep data\tabcellsep data\tabcellsep data\tabcellsep data\\
1\tabcellsep 100.00\tabcellsep 100.00\tabcellsep 100.00\tabcellsep 80.00\\
2\tabcellsep 100.00\tabcellsep 100.00\tabcellsep 100.00\tabcellsep 80.00\\
3\tabcellsep 100.00\tabcellsep 100.00\tabcellsep 100.00\tabcellsep 66.67\\
4\tabcellsep 93.33\tabcellsep 99.23\tabcellsep 100.00\tabcellsep 66.67\\
5\tabcellsep 100.00\tabcellsep 100.00\tabcellsep 100.00\tabcellsep 80.00\\
6\tabcellsep 92.86\tabcellsep 100.00\tabcellsep 100.00\tabcellsep 85.71\\
7\tabcellsep 100.00\tabcellsep 100.00\tabcellsep 100.00\tabcellsep 64.29\\
8\tabcellsep 100.00\tabcellsep 100.00\tabcellsep 100.00\tabcellsep 78.57\\
9\tabcellsep 100.00\tabcellsep 100.00\tabcellsep 100.00\tabcellsep 82.21\\
10\tabcellsep 100.00\tabcellsep 100.00\tabcellsep 100.00\tabcellsep 71.43\\
Min\tabcellsep 92.86\tabcellsep 99.23\tabcellsep 100.00\tabcellsep 64.29\\
Max\tabcellsep 100.00\tabcellsep 100.00\tabcellsep 100.00\tabcellsep 85.71\\
Median\tabcellsep 100.00\tabcellsep 100.00\tabcellsep 100.00\tabcellsep 85.71\\
Variance\tabcellsep 9.28\tabcellsep 0.07\tabcellsep 0.00\tabcellsep 61.99\\
Mean\tabcellsep 98.62\tabcellsep 99.92\tabcellsep 100.00\tabcellsep 75.55\end{longtable} \par
 
\caption{\label{tab_2}Table 3:}\end{figure}
 \begin{figure}[htbp]
\noindent\textbf{4} \par 
\begin{longtable}{P{0.23181818181818178\textwidth}P{0.29363636363636364\textwidth}P{0.3245454545454545\textwidth}}
Fold\tabcellsep Cont Rule\tabcellsep Height Tree\\
1\tabcellsep 3\tabcellsep 2\\
2\tabcellsep 3\tabcellsep 2\\
3\tabcellsep 3\tabcellsep 2\\
4\tabcellsep 2\tabcellsep 1\\
5\tabcellsep 3\tabcellsep 2\\
6\tabcellsep 2\tabcellsep 1\\
7\tabcellsep 3\tabcellsep 2\\
8\tabcellsep 3\tabcellsep 2\\
9\tabcellsep 3\tabcellsep 2\\
10\tabcellsep 3\tabcellsep 2\end{longtable} \par
 
\caption{\label{tab_3}Table 4:}\end{figure}
 \begin{figure}[htbp]
\noindent\textbf{5} \par 
\begin{longtable}{P{0.4533333333333333\textwidth}P{0.39666666666666667\textwidth}}
Methods\tabcellsep NBBN\\
CART\tabcellsep -3.536 (0.011)\end{longtable} \par
  {\small\itshape [Note: D]} 
\caption{\label{tab_4}Table 5:}\end{figure}
 \begin{figure}[htbp]
\noindent\textbf{6} \par 
\begin{longtable}{P{0.07456140350877193\textwidth}P{0.4399122807017544\textwidth}P{0.3355263157894737\textwidth}}
\tabcellsep \multicolumn{2}{l}{Real status}\\
Prediction\tabcellsep Non going\tabcellsep Going concern\\
\tabcellsep concern status\tabcellsep status\\
\tabcellsep $1-P_{22}$ (Type I error)\tabcellsep $P_{11}$\\
\tabcellsep $P_{22}$\tabcellsep $1-P_{11}$ (Type II error)\end{longtable} \par
 
\caption{\label{tab_5}Table 6:}\end{figure}
 			\footnote{© 2013 Global Journals Inc. (US)} 		 		\backmatter  			  				\begin{bibitemlist}{1}
\bibitem[Brabazon and Keenan ()]{b2}\label{b2} 	 		‘A hybrid genetic model for the prediction of corporate failure’.  		 			A Brabazon 		,  		 			B Keenan 		.  	 	 		\textit{Computational Management Science}  		2004. Springer-Verlag. p. .  	 
\bibitem[Menon and Schwartz ()]{b13}\label{b13} 	 		‘An empirical investigation of audit qualification decisions in the presence of going concern uncertainties’.  		 			K Menon 		,  		 			K Schwartz 		.  	 	 		\textit{Contemporary Accounting Research}  		1987. 3  (2)  p. .  	 
\bibitem[Kida ()]{b4}\label{b4} 	 		‘An investigation into auditors, continuity and related qualification judgments’.  		 			T Kida 		.  	 	 		\textit{Journal of Accounting Research}  		1980. 18  (2)  p. .  	 
\bibitem[Breiman et al. ()]{b3}\label{b3} 	 		\textit{Classification and regression trees},  		 			L Breiman 		,  		 			J Friedman 		,  		 			R Olshen 		,  		 			C Stone 		.  		1984.  	 	 (International Group) 
\bibitem[Ashoori and Mohammadi ()]{b1}\label{b1} 	 		‘Compare failure prediction models based on feature selection technique: empirical case from Iran’.  		 			S Ashoori 		,  		 			S Mohammadi 		.  	 	 		\textit{Procedia Computer Science}  		2011. 3 p. .  	 
\bibitem[Mckee ()]{b12}\label{b12} 	 		‘Discriminant prediction of going concern status: A model for auditors’.  		 			T Mckee 		.  	 	 		\textit{Selected Papers of the AAA Annual Meeting},  				1976.  	 
\bibitem[Mokhatab Rafiei et al. ()]{b14}\label{b14} 	 		‘Financial health prediction models using artificial neural networks, genetic algorithm and multivariate discriminant analysis: Iranian evidence’.  		 			F Mokhatab Rafiei 		,  		 			S M Manzari 		,  		 			S Bostanian 		.  	 	 		\textit{Expert Systems with Applications}  		2011. 38 p. .  	 
\bibitem[Koh and Kee Low ()]{b8}\label{b8} 	 		‘Going concern prediction using data mining techniques’.  		 			H C Koh 		,  		 			C Kee Low 		.  	 	 		\textit{Managerial Auditing Journal}  		2004. 19  (3)  p. .  	 
\bibitem[Soni ()]{b15}\label{b15} 	 		‘Implementation of multivariate data set by CART algorithm’.  		 			S Soni 		.  	 	 		\textit{Journal of Information Technology and Knowledge Management}  		2010. 2  (2)  p. .  	 
\bibitem[Li et al. ()]{b9}\label{b9} 	 		‘Predicting business failure using classification and regression tree: An empirical comparison with popular classical statistical methods and top classification mining methods’.  		 			H Li 		,  		 			J Sun 		,  		 			J Wu 		.  	 	 		\textit{Expert Systems with Applications}  		2010. 37 p. .  	 
\bibitem[Martens et al. ()]{b11}\label{b11} 	 		‘Predicting going concern opinion with data mining’.  		 			D Martens 		,  		 			L Bruynseels 		,  		 			B Baesens 		,  		 			M Willekens 		,  		 			J Vanthienen 		.  	 	 		\textit{Decision Support Systems}  		2008. 45 p. .  	 
\bibitem[Koh ()]{b5}\label{b5} 	 		\textit{Prediction of going-concern status: A probit model for the auditors},  		 			H Koh 		.  		1987.  		 			Virginia Polytechnic Institute and State University 		 	 	 (Ph.D. dissertation) 
\bibitem[Markov ()]{b10}\label{b10} 	 		\textit{Probabilistic reasoning with naïve Bayes and Bayesian networks, PhD dissertation},  		 			Z Markov 		.  		2007.  		 			Central Connecticut State University 		 	 
\bibitem[Koh and Brown ()]{b6}\label{b6} 	 		‘Probit prediction of going and non-going concerns’.  		 			H Koh 		,  		 			R Brown 		.  	 	 		\textit{Managerial Auditing Journal}  		1991. 6  (3)  p. .  	 
\bibitem[Koh and Killough ()]{b7}\label{b7} 	 		‘Proposed statement on auditing standards: the auditor's consideration of an entity's ability to continue existence’.  		 			H C Koh 		,  		 			L N Killough 		.  	 	 		\textit{Virginia Accountant Quarterly}  		1988. 40  (2)  p. .  	 
\bibitem[AICPA ()]{b0}\label{b0} 	 		‘The auditor's consideration of an entity's ability to continue in existence’.  		 			AICPA 		.  	 	 		\textit{Statement on auditing standards},  				1998.  	 
\bibitem[Sun and Shenoy ()]{b16}\label{b16} 	 		\textit{Using Bayesian Networks for Bankruptcy Prediction: Some},  		 			L Sun 		,  		 			P Shenoy 		.  		2007.  	 
\end{bibitemlist}
 			 		 	 
\end{document}
