\documentclass[11pt,twoside]{article}\makeatletter

\IfFileExists{xcolor.sty}%
  {\RequirePackage{xcolor}}%
  {\RequirePackage{color}}
\usepackage{colortbl}
\usepackage{wrapfig}
\usepackage{ifxetex}
\ifxetex
  \usepackage{fontspec}
  \usepackage{xunicode}
  \catcode`⃥=\active \def⃥{\textbackslash}
  \catcode`❴=\active \def❴{\{}
  \catcode`❵=\active \def❵{\}}
  \def\textJapanese{\fontspec{Noto Sans CJK JP}}
  \def\textChinese{\fontspec{Noto Sans CJK SC}}
  \def\textKorean{\fontspec{Noto Sans CJK KR}}
  \setmonofont{DejaVu Sans Mono}
  
\else
  \IfFileExists{utf8x.def}%
   {\usepackage[utf8x]{inputenc}
      \PrerenderUnicode{–}
    }%
   {\usepackage[utf8]{inputenc}}
  \usepackage[english]{babel}
  \usepackage[T1]{fontenc}
  \usepackage{float}
  \usepackage[]{ucs}
  \uc@dclc{8421}{default}{\textbackslash }
  \uc@dclc{10100}{default}{\{}
  \uc@dclc{10101}{default}{\}}
  \uc@dclc{8491}{default}{\AA{}}
  \uc@dclc{8239}{default}{\,}
  \uc@dclc{20154}{default}{ }
  \uc@dclc{10148}{default}{>}
  % Fallback text macros for the non-XeTeX branch (no fontspec available).
  % \textschwa is built with \rotatebox, which comes from graphicx; graphicx
  % is loaded later in this preamble, so the macro is usable in the body.
  \def\textschwa{\rotatebox{-90}{e}}
  % The CJK font switches are no-ops in this branch. All three switches that
  % the XeTeX branch defines must exist here too, otherwise a document using
  % \textKorean compiles under XeTeX but stops with "Undefined control
  % sequence" under other engines.
  \def\textJapanese{}
  \def\textChinese{}
  \def\textKorean{}
  \IfFileExists{tipa.sty}{\usepackage{tipa}}{}
\fi
\def\exampleFont{\ttfamily\small}
\DeclareTextSymbol{\textpi}{OML}{25}
\usepackage{relsize}
\RequirePackage{array}
% \@testpach: classifies the current tabular-preamble token (\@nextchar) by
% assigning \@chclass and \@chnum.
%   * If the previous class (\@lastchclass) was 6, 7, 8 or 9, the class is set
%     to 1, 5, 2 or 3 respectively (for 6, \@chnum is also set to 1).
%   * Otherwise the class starts at 0 and, unless \@lastchclass is 10,
%     \@nextchar is stringified and tested character by character:
%       c / l / r      -> class 0, \@chnum 0 / 1 / 2
%       |              -> class 1
%       ! @ ( )        -> class 6 / 7 / 8 / 9
%       m / p / b      -> class 10, \@chnum 3 / 4 / 5
%       anything else  -> class 0, \@chnum 0 and \@preamerr 0 is raised.
% NOTE(review): this definition is placed directly after loading array and
% presumably replaces that package's own version, with `(' and `)' standing
% in for the stock `<' and `>' specifiers -- confirm against array.sty.
% The `){...}' prefixes used by \Panel and by the column types defined in this
% preamble rely on `)' being recognised here.
\def\@testpach{\@chclass
 \ifnum \@lastchclass=6 \@ne \@chnum \@ne \else
  \ifnum \@lastchclass=7 5 \else
   \ifnum \@lastchclass=8 \tw@ \else
    \ifnum \@lastchclass=9 \thr@@
   \else \z@
   \ifnum \@lastchclass = 10 \else
   \edef\@nextchar{\expandafter\string\@nextchar}%
   \@chnum
   \if \@nextchar c\z@ \else
    \if \@nextchar l\@ne \else
     \if \@nextchar r\tw@ \else
   \z@ \@chclass
   \if\@nextchar |\@ne \else
    \if \@nextchar !6 \else
     \if \@nextchar @7 \else
      \if \@nextchar (8 \else
       \if \@nextchar )9 \else
  10
  \@chnum
  \if \@nextchar m\thr@@\else
   \if \@nextchar p4 \else
    \if \@nextchar b5 \else
   \z@ \@chclass \z@ \@preamerr \z@ \fi \fi \fi \fi
   \fi \fi  \fi  \fi  \fi  \fi  \fi \fi \fi \fi \fi \fi}
\gdef\arraybackslash{\let\\=\@arraycr}
\def\@textsubscript#1{{\m@th\ensuremath{_{\mbox{\fontsize\sf@size\z@#1}}}}}
\def\Panel#1#2#3#4{\multicolumn{#3}{){\columncolor{#2}}#4}{#1}}
\def\abbr{}
\def\corr{}
\def\expan{}
\def\gap{}
\def\orig{}
\def\reg{}
\def\ref{}
\def\sic{}
\def\persName{}\def\name{}
\def\placeName{}
\def\orgName{}
\def\textcal#1{{\fontspec{Lucida Calligraphy}#1}}
\def\textgothic#1{{\fontspec{Lucida Blackletter}#1}}
\def\textlarge#1{{\large #1}}
\def\textoverbar#1{\ensuremath{\overline{#1}}}
\def\textquoted#1{‘#1’}
\def\textsmall#1{{\small #1}}
\def\textsubscript#1{\@textsubscript{\selectfont#1}}
\def\textxi{\ensuremath{\xi}}
\def\titlem{\itshape}
\newenvironment{biblfree}{}{\ifvmode\par\fi }
\newenvironment{bibl}{}{}
\newenvironment{byline}{\vskip6pt\itshape\fontsize{16pt}{18pt}\selectfont}{\par }
\newenvironment{citbibl}{}{\ifvmode\par\fi }
\newenvironment{docAuthor}{\ifvmode\vskip4pt\fontsize{16pt}{18pt}\selectfont\fi\itshape}{\ifvmode\par\fi }
\newenvironment{docDate}{}{\ifvmode\par\fi }
\newenvironment{docImprint}{\vskip 6pt}{\ifvmode\par\fi }
\newenvironment{docTitle}{\vskip6pt\bfseries\fontsize{22pt}{25pt}\selectfont}{\par }
\newenvironment{msHead}{\vskip 6pt}{\par}
\newenvironment{msItem}{\vskip 6pt}{\par}
\newenvironment{rubric}{}{}
\newenvironment{titlePart}{}{\par }

% One-argument column types; the argument is the column width.
%   L, C, R : p{} column preceded by \raggedright, \centering or \raggedleft
%   P, B, M : plain p{}, b{} and m{} columns
% Every type inserts \arraybackslash through a `){...}' prefix, so that \\
% ends the table row again (see \arraybackslash, which restores \\ to
% \@arraycr).
% NOTE(review): `){...}' is this preamble's spelling of the per-cell prefix
% specifier; it depends on the \@testpach definition in this file accepting
% `)' -- confirm before replacing it with `>{...}'.
\newcolumntype{L}[1]{){\raggedright\arraybackslash}p{#1}}
\newcolumntype{C}[1]{){\centering\arraybackslash}p{#1}}
\newcolumntype{R}[1]{){\raggedleft\arraybackslash}p{#1}}
\newcolumntype{P}[1]{){\arraybackslash}p{#1}}
\newcolumntype{B}[1]{){\arraybackslash}b{#1}}
\newcolumntype{M}[1]{){\arraybackslash}m{#1}}
\definecolor{label}{gray}{0.75}
\def\unusedattribute#1{\sout{\textcolor{label}{#1}}}
\DeclareRobustCommand*{\xref}{\hyper@normalise\xref@}
\def\xref@#1#2{\hyper@linkurl{#2}{#1}}
% Underscore handling.
% Inside a group, `_' is made an active character and globally defined to
% take one argument and typeset it as an upright (\mathrm) subscript via
% \ensuremath. After the group, the math code of `_' is set to "8000 and its
% category code to 12, so a literal underscore can be typed in text.
% NOTE(review): math code "8000 presumably makes `_' behave as the active
% definition above while in math mode -- confirm against the TeXbook.
% \string is applied to the double quote, presumably to guard against a
% package having made `"' active.
\begingroup
\catcode`\_=\active
\gdef_#1{\ensuremath{\sb{\mathrm{#1}}}}
\endgroup
\mathcode`\_=\string"8000
\catcode`\_=12\relax

\usepackage[a4paper,twoside,lmargin=1in,rmargin=1in,tmargin=1in,bmargin=1in,marginparwidth=0.75in]{geometry}
\usepackage{framed}

\definecolor{shadecolor}{gray}{0.95}
\usepackage{longtable}
\usepackage[normalem]{ulem}
\usepackage{fancyvrb}
\usepackage{fancyhdr}
\usepackage{graphicx}
\usepackage{marginnote}

\renewcommand{\@cite}[1]{#1}


\renewcommand*{\marginfont}{\itshape\footnotesize}

\def\Gin@extensions{.pdf,.png,.jpg,.mps,.tif}

  \pagestyle{fancy}

\usepackage[pdftitle={Data Preprocessing in Multi-Temporal Remote Sensing Data for Deforestation Analysis},
 pdfauthor={}]{hyperref}
\hyperbaseurl{}

	 \paperwidth210mm
	 \paperheight297mm
              
\def\@pnumwidth{1.55em}
\def\@tocrmarg {2.55em}
\def\@dotsep{4.5}
\setcounter{tocdepth}{3}
\clubpenalty=8000
\emergencystretch 3em
\hbadness=4000
\hyphenpenalty=400
\pretolerance=750
\tolerance=2000
\vbadness=4000
\widowpenalty=10000

% Heading layout for the five sectioning levels, each built on \@startsection.
% The arguments are, in order: counter name, level, indent, space before,
% space after, and font style.
%   \section       level 1, no indent, \Large bold
%   \subsection    level 2, no indent, \Large
%   \subsubsection level 3, no indent, \large
%   \paragraph     level 4, no indent, \normalsize
%   \subparagraph  level 5, indented by \parindent, \normalsize bold
% NOTE(review): per the LaTeX kernel documentation a negative "space before"
% suppresses the indent of the following paragraph and a negative "space
% after" (as in \subparagraph) produces a run-in heading -- confirm there
% before changing any sign.
\renewcommand\section{\@startsection {section}{1}{\z@}%
     {-1.75ex \@plus -0.5ex \@minus -.2ex}%
     {0.5ex \@plus .2ex}%
     {\reset@font\Large\bfseries}}
\renewcommand\subsection{\@startsection{subsection}{2}{\z@}%
     {-1.75ex\@plus -0.5ex \@minus- .2ex}%
     {0.5ex \@plus .2ex}%
     {\reset@font\Large}}
\renewcommand\subsubsection{\@startsection{subsubsection}{3}{\z@}%
     {-1.5ex\@plus -0.35ex \@minus -.2ex}%
     {0.5ex \@plus .2ex}%
     {\reset@font\large}}
\renewcommand\paragraph{\@startsection{paragraph}{4}{\z@}%
     {-1ex \@plus-0.35ex \@minus -0.2ex}%
     {0.5ex \@plus .2ex}%
     {\reset@font\normalsize}}
\renewcommand\subparagraph{\@startsection{subparagraph}{5}{\parindent}%
     {1.5ex \@plus1ex \@minus .2ex}%
     {-1em}%
     {\reset@font\normalsize\bfseries}}


\def\l@section#1#2{\addpenalty{\@secpenalty} \addvspace{1.0em plus 1pt}
 \@tempdima 1.5em \begingroup
 \parindent \z@ \rightskip \@pnumwidth 
 \parfillskip -\@pnumwidth 
 \bfseries \leavevmode #1\hfil \hbox to\@pnumwidth{\hss #2}\par
 \endgroup}
\def\l@subsection{\@dottedtocline{2}{1.5em}{2.3em}}
\def\l@subsubsection{\@dottedtocline{3}{3.8em}{3.2em}}
\def\l@paragraph{\@dottedtocline{4}{7.0em}{4.1em}}
\def\l@subparagraph{\@dottedtocline{5}{10em}{5em}}
\@ifundefined{c@section}{\newcounter{section}}{}
\@ifundefined{c@chapter}{\newcounter{chapter}}{}
\newif\if@mainmatter 
\@mainmattertrue
\def\chaptername{Chapter}
% \frontmatter: switches page numbering to roman and makes the printed
% chapter and section numbers (\thechapter, \thesection) lower-case roman.
% \theHchapter and \theHsection are set to match (presumably the
% hyperref-side counter representations -- confirm). \@chapapp is emptied.
\def\frontmatter{%
  \pagenumbering{roman}
  \def\thechapter{\@roman\c@chapter}
  \def\theHchapter{\roman{chapter}}
  \def\thesection{\@roman\c@section}
  \def\theHsection{\roman{section}}
  \def\@chapapp{}%
}
% \mainmatter: starts on a fresh page (\cleardoublepage), resets the chapter
% and section counters to 0, switches page, chapter and section numbering to
% arabic, raises secnumdepth to 6 and sets \@chapapp to \chaptername.
\def\mainmatter{%
  \cleardoublepage
  \def\thechapter{\@arabic\c@chapter}
  \setcounter{chapter}{0}
  \setcounter{section}{0}
  \pagenumbering{arabic}
  \setcounter{secnumdepth}{6}
  \def\@chapapp{\chaptername}%
  \def\theHchapter{\arabic{chapter}}
  \def\thesection{\@arabic\c@section}
  \def\theHsection{\arabic{section}}
}
% \backmatter: starts on a fresh page, resets the chapter and section
% counters to 0, lowers secnumdepth to 2, numbers chapters with capital
% letters, sets \@chapapp to \appendixname and finally calls \appendix.
\def\backmatter{%
  \cleardoublepage
  \setcounter{chapter}{0}
  \setcounter{section}{0}
  \setcounter{secnumdepth}{2}
  \def\@chapapp{\appendixname}%
  \def\thechapter{\@Alph\c@chapter}
  \def\theHchapter{\Alph{chapter}}
  \appendix
}
\newenvironment{bibitemlist}[1]{%
   \list{\@biblabel{\@arabic\c@enumiv}}%
       {\settowidth\labelwidth{\@biblabel{#1}}%
        \leftmargin\labelwidth
        \advance\leftmargin\labelsep
        \@openbib@code
        \usecounter{enumiv}%
        \let\p@enumiv\@empty
        \renewcommand\theenumiv{\@arabic\c@enumiv}%
	}%
  \sloppy
  \clubpenalty4000
  \@clubpenalty \clubpenalty
  \widowpenalty4000%
  \sfcode`\.\@m}%
  {\def\@noitemerr
    {\@latex@warning{Empty `bibitemlist' environment}}%
    \endlist}

% Table of contents: an unnumbered section headed by \contentsname, followed
% by the entries read through \@starttoc{toc}.
\def\tableofcontents{\section*{\contentsname}\@starttoc{toc}}
% Paragraph layout: no extra vertical space between paragraphs, 1em indent.
\parskip0pt
\parindent1em
% \Panel is not redefined here: the definition earlier in this preamble
% (next to \arraybackslash and \@textsubscript) has exactly the same body, so
% a second \def would only be a silent, redundant overwrite.
% reflist: ragged-right list with an empty default label. Labels passed to
% \item are set in italics. Vertical spacing is tightened (\topsep, \itemsep
% and \parskip are 0pt, \parsep is 2pt) and the right margin is 0.25in.
\newenvironment{reflist}{%
  \begin{raggedright}\begin{list}{}
  {%
   \def\makelabel##1{\itshape ##1}%
   \setlength{\rightmargin}{0.25in}%
   \setlength{\itemindent}{0pt}%
   \setlength{\topsep}{0pt}%
   \setlength{\itemsep}{0pt}%
   \setlength{\parsep}{2pt}%
   \setlength{\parskip}{0pt}}%
  }
  {\end{list}\end{raggedright}}
% sansreflist: same geometry as reflist, but \item labels are set upright
% (\upshape) instead of italic.
\newenvironment{sansreflist}{%
  \begin{raggedright}\begin{list}{}
  {%
   \def\makelabel##1{\upshape ##1}%
   \setlength{\rightmargin}{0.25in}%
   \setlength{\itemindent}{0pt}%
   \setlength{\topsep}{0pt}%
   \setlength{\itemsep}{0pt}%
   \setlength{\parsep}{2pt}%
   \setlength{\parskip}{0pt}}%
  }
  {\end{list}\end{raggedright}}
\newenvironment{specHead}[2]%
 {\vspace{20pt}\hrule\vspace{10pt}%
  \phantomsection\label{#1}\markright{#2}%

  \pdfbookmark[2]{#2}{#1}%
  \hspace{-0.75in}{\bfseries\fontsize{16pt}{18pt}\selectfont#2}%
  }{}
      % Document metadata macros.
      \def\TheFullDate{2013-01-15 (revised: 15 January 2013)}
% \TheID is printed in the page footers (\fancyfoot[LO] and \fancyfoot[RE]).
% It previously expanded to \makeatother, i.e. a catcode change was executed
% every time a footer was typeset. The document has no identifier, so the
% macro is now simply empty; the footers look the same. The catcode of `@'
% at this point of the preamble is unchanged by this edit.
\def\TheID{}
\def\TheDate{2013-01-15}
\title{Data Preprocessing in Multi-Temporal Remote Sensing Data for Deforestation Analysis}
\author{}\makeatletter 
\makeatletter
% \cleartoleftpage: flushes the current page with \clearpage. In a two-sided
% document, if the page counter is then odd, an empty page is emitted so that
% what follows starts on an even-numbered page; in two-column mode a second
% empty \newpage is issued as well.
\newcommand*{\cleartoleftpage}{%
  \clearpage
  \if@twoside\ifodd\c@page
    \null\newpage                   % \null is the kernel's \hbox{}
    \if@twocolumn\null\newpage\fi
  \fi\fi
}
\makeatother
\makeatletter
\thispagestyle{empty}
\markright{\@title}\markboth{\@title}{\@author}
\renewcommand\small{\@setfontsize\small{9pt}{11pt}\abovedisplayskip 8.5\p@ plus3\p@ minus4\p@
\belowdisplayskip \abovedisplayskip
\abovedisplayshortskip \z@ plus2\p@
\belowdisplayshortskip 4\p@ plus2\p@ minus2\p@
\def\@listi{\leftmargin\leftmargini
               \topsep 2\p@ plus1\p@ minus1\p@
               \parsep 2\p@ plus\p@ minus\p@
               \itemsep 1pt}
}
\makeatother
\fvset{frame=single,numberblanklines=false,xleftmargin=5mm,xrightmargin=5mm}
% Running heads and feet (fancyhdr). Everything is cleared first, then:
%   head: \leftmark on the left of even pages, \rightmark on the right of
%         odd pages, both bold;
%   foot: page number centred, \TheID at the left of odd pages and at the
%         right of even pages, the remaining two corners explicitly empty.
\fancyhf{}
\setlength{\headheight}{14pt}
\fancyhead[LE]{\bfseries\leftmark}
\fancyhead[RO]{\bfseries\rightmark}
\fancyfoot[CO,CE]{\thepage}
\fancyfoot[LO,RE]{\TheID}
\fancyfoot[RO,LE]{}
\hypersetup{citebordercolor=0.75 0.75 0.75,linkbordercolor=0.75 0.75 0.75,urlbordercolor=0.75 0.75 0.75,bookmarksnumbered=true}
\fancypagestyle{plain}{\fancyhead{}\renewcommand{\headrulewidth}{0pt}}

\date{}
\usepackage{authblk}

% \keywords{<comma-separated terms>}: typesets an "Index terms---" line in
% \footnotesize, followed by the given terms.
% The size switch is kept inside a group. Without the group, \footnotesize
% stayed in force after the macro and shrank all body text that followed
% \keywords{...}. The paragraph is ended inside the group so that the
% \footnotesize line spacing is the one applied to the keywords line itself.
\providecommand{\keywords}[1]{%
  {\footnotesize
   \textbf{\textit{Index terms---}} #1\par}%
}

\usepackage{graphicx,xcolor}
\definecolor{GJBlue}{HTML}{273B81}
\definecolor{GJLightBlue}{HTML}{0A9DD9}
\definecolor{GJMediumGrey}{HTML}{6D6E70}
\definecolor{GJLightGrey}{HTML}{929497} 

% abstract: replaces the class's abstract layout.
% Begin code: paragraph indent set to 0pt and text set ragged-right, then a
% 2pt rule across \textwidth in GJMediumGrey, 16pt of vertical space, and
% the \abstractname heading in large bold GJBlue followed by a space.
% End code: 8pt of vertical space, a second grey 2pt rule, 16pt of space.
\renewenvironment{abstract}{% begin code
   \setlength{\parindent}{0pt}\raggedright
   \textcolor{GJMediumGrey}{\rule{\textwidth}{2pt}}
   \vskip16pt
   \textcolor{GJBlue}{\large\bfseries\abstractname\space}
}{% end code
   \vskip8pt
   \textcolor{GJMediumGrey}{\rule{\textwidth}{2pt}}
   \vskip16pt
}

\usepackage[absolute,overlay]{textpos}

\makeatother 
      \usepackage{lineno}
      \linenumbers
      
\begin{document}

             \author[1]{Dr.  Manjula}

             \author[2]{Dr.  Jyothi}

             \author[3]{Dr.  Manjula}

             \affil[1]{  SASTRA University}

\renewcommand\Authands{ and }

\date{\small \em Received: 13 December 2012 Accepted: 5 January 2013 Published: 15 January 2013}

\maketitle


\begin{abstract}
        

In recent years, the contemporary data mining community has developed a plethora of algorithms and methods used for different tasks in knowledge discovery within large databases. Furthermore, as algorithms become more complex and hybrid algorithms combining several approaches are suggested, the task of implementing such algorithms from scratch becomes increasingly time-consuming. Spatial data sets often contain large amounts of data arranged in multiple layers. These data may contain errors and may not be collected at a common set of coordinates. Therefore, various data preprocessing steps are often necessary to prepare data for further usage. It is important to understand the quality and characteristics of the chosen data. Careful selection, preprocessing, and transformation of the data are needed to ensure meaningful analysis and results.

\end{abstract}


\keywords{data preprocessing, data mining, remote sensing images, deforestation analysis.}

\begin{textblock*}{18cm}(1cm,1cm) % {block width} (coords) 
\textcolor{GJBlue}{\LARGE Global Journals \LaTeX\ JournalKaleidoscope\texttrademark}
\end{textblock*}

\begin{textblock*}{18cm}(1.4cm,1.5cm) % {block width} (coords) 
\textcolor{GJBlue}{\footnotesize \\ Artificial Intelligence formulated this projection for compatibility purposes from the original article published at Global Journals. However, this technology is currently in beta. \emph{Therefore, kindly ignore odd layouts, missed formulae, text, tables, or figures.}}
\end{textblock*}


\let\tabcellsep& 	 	 		 
\section[{Introduction}]{Introduction}\par
The technical progress in computerized data acquisition and storage results in the growth of vast databases. With continuous increase and accumulation, the huge amount of computerized data has far exceeded the human ability to completely interpret and use it. Users need adequate search tools in order to quickly access and filter relevant information. The development of novel techniques and tools to assist humans in the transformation of data into useful knowledge has been the heart of the comparatively new and interdisciplinary research area called ``Knowledge Discovery in Databases (KDD)''. With the rapid growth of research in data mining and data warehousing, many systems have emerged in those fields.\par
It is important to understand the quality and characteristics of the chosen data. Careful selection, preprocessing, and transformation of the data are needed to ensure meaningful analysis and results. What variables should be selected? What measurement framework, such as Euclidean space or non-metric network space, should be used? What spatial relations or contextual information should be considered? Can the chosen data adequately represent the complexity and nature of the problem?\par
\section[{a) Study Area}]{a) Study Area}\par
The setting of this study spans an area of 5000 Square Kilometers and it includes the mandals of Chittoor such as Thirupathi, Kalahasthi, Yerpedu, Renigunta and major portion of Kadapa Mandals such as Nandalur, Chitvel, Rajampet, Pullampet, Obulavari Palli, Kodur, and Nellore District mandals such as Venkatagiri, Rapur, Kaluya and Takkili. The study area boundary in lat-long is E 79 39" to E 78 45" and N 13 35" to N 14 33". The study area district outline is shown in Figure 1.\par
Aleksandar Lazarevic et al.\ \hyperref[b1]{[3]} proposed the software system for spatial data analysis and modelling (SDAM), which provides flexible machine learning tools for supporting an interactive knowledge discovery process in large centralized or distributed spatial databases. Caroline M. Bruce and David W. Hilbert \hyperref[b2]{[4]} suggested a pre-processing methodology for application to Landsat TM/ETM+. This report details the various pre-processing techniques used either to derive multitemporal and multispatial image classifications or in biophysical/geochemical modelling. P.S. Roy et al.\ [10] proposed a multilevel land use land cover (LULC) classification system, wherein LULC information can be accessed nationwide, statewide and at the intrastate, regional or municipal level. Stefan Erasmi et al.\ [11] evaluated available satellite data sets and established a transparent workflow for the monitoring of past and future land cover dynamics at a regional scale based on medium resolution satellite data while mapping deforestation and land cover conversion at the rainforest margin in central Sulawesi, Indonesia. 
\section[{II.}]{II.} 
\section[{Data Preparation}]{Data Preparation}\par
One of the methods for change detection using satellite images is to compare the results of classified images. The advantage of the classified-map comparison method is that not only the location but also the nature and type of the changes are determined in the study area. In this method, first, the images of different times are classified according to the purpose of change detection. Afterward, by overlaying these classified images with a proper overlay condition, the location and amount of these changes that are interested is determined. As the goal is to determine the deforestation, the only two classes that are considered are the forest and non-forest. 
\section[{III.}]{III.} 
\section[{Data Preprocessing}]{Data Preprocessing}\par
Under data preprocessing, the non spatial data are preprocessed with normalization, generalization and other techniques. For the satellite image, the preprocessing is done both at the image dissemination and during feature extraction process. These data are preprocessed to fill data gaps and correct data anomalies. This paper provides a brief description of various preprocessing methods that is applied on the collected images in order to achieve the data quality of the study while classifying the image. 
\section[{a) Part I -Collateral Data Preprocessing}]{a) Part I -Collateral Data Preprocessing}\par
Spatial data sets often contain large amounts of data arranged in multiple layers. These data may contain errors and may not be collected at a common set of coordinates. Therefore, various data preprocessing steps are often necessary to prepare data for further usage. The following figure explores the preprocessing steps generally used for all types of data \hyperref[b1]{[3]}. Due to the high possibility of measurement noise present in collected data sets, there is a need for data cleaning. Data cleaning consists of removing duplicate data points and removing value outliers as well as spatial outliers. Data can also be filtered or smoothed by applying a median filter with a window size specified by the user. 
\section[{ii. Data Interpolation}]{ii. Data Interpolation}\par
In many real life spatial domain applications, the resolution will vary among data layers and the data will not be collected at a common set of spatial locations. Therefore, it is necessary to apply an interpolation procedure to the data to change data resolution and to compute values for a common set of locations. Deterministic interpolation techniques such as inverse distance and triangulation can be used but they do not take into account a model of the spatial process or variograms.\par
\section[{iii. Data Normalization}]{iii. Data Normalization}\par
The system supports two normalization methods: the transformation of data to a normal distribution and the scaling of data to a specified range. In this work, normalization is applied to the image data while georeferencing the images of the three time periods. 
\section[{iv. Data Discretization}]{iv. Data Discretization}\par
This step is necessary in some modeling techniques like association rules, decision tree learning and all classification problems and includes different attribute and target splitting criteria. In this work discretization is applied for collateral data that includes population data with diversity in data. So this data is discretized into three ranges of groups as 'High', 'Low' and 'Medium'.  
\section[{Feature Selection}]{Feature Selection}\par
In domains with a large number of attributes this step is often beneficial for reducing attribute space by removing irrelevant attributes. Several selection techniques (Forward Selection, Backward Elimination, Branch and Bound) and various criteria (inter-class and probabilistic selection criteria) are supported in order to identify a relevant attribute subset.\par
In this thesis, while preparing a single table input for association rule mining, some of the attributes in individual tables are removed as irrelevant. For deriving rules the attributes such as Gridcode, Area etc are removed as it does not give any meaningful information while deriving rules. Availability, Accessibility, and Affordability of Remote Sensing Data, a range of airborne and spaceborne sensors has acquired remote sensing data, with the number of sensors and their diversity of capability increasing over time. Ideally, the following image characteristics are required for studying defore -station \hyperref[b0]{[1]}  The impact at different times and the influence of these factors on the images must be fully taken into account in the change detection. The influence may be eliminated as much as possible by the geometric registration and radiometric correction on the remote sensing images. 
\section[{Preprocessing and Analysis of the Satellite Images}]{Preprocessing and Analysis of the Satellite Images}\par
Prior to data analysis, initial processing on the raw data is usually carried out to correct for any distortion due to the characteristics of the imaging system and imaging conditions. Depending on the user's requirement, some standard correction procedures may be carried out by the ground station operators before the data is delivered to the end-user. Figure 3.2 shows the processing procedure applied to image data \hyperref[b0]{[1]} \hyperref[b2]{[4]} [10].\par
Figure 3.2: Processing Procedures Applied to Imagery Data\par
Usually three types of errors occur when a satellite image is generated by the satellite sensor. The first is the sensor error. The second is the error created by the atmospheric parameters, which affect the amount of radiation received by the sensor. The third is the geometric error related to the curvature of the Earth's surface, the Earth's rotation, elevation differences, the location and situation of the satellite, etc. Therefore, these errors should be considered and managed before using the data:\par
1. Sensor Errors: The two images used were already corrected by their providers. Therefore, there was no need for any processing in this regard. 
\section[{Radiometric Correction:}]{Radiometric Correction:}\par
The Earth atmosphere scatters the shorter wavelengths in a selective manner and this reduces the contrast of the image. The numerical value of each pixel in the image is not a realistic representation of the amount of radiation from the ground surface. These values are changed either by atmospheric absorption or by scattering throughout the atmosphere.\par
3. Atmospheric Effects: Scattering and absorption of EM radiation by the atmosphere have significant effects that impact sensor design as well as the processing and interpretation of images. When the concentration of scattering agents is high, scattering produces the visual effect we call haze. Haze increases the overall brightness of a scene and reduces the contrast between different ground materials. In general, atmospheric errors are discussed in three parts: the Haze, Sun angle and Skylight errors.\par
Atmospheric corrections are required in the following situations:
\begin{itemize}
\item When the user wants to compare images related to different times.
\item When using methods such as image subtraction and image division for change detection, because the effects of the atmosphere on the two images related to different times are quite different.
\item When the ratio of two bands of an image needs to be calculated, because the atmosphere has different effects on different wavelengths.
\item When the user wants to study spectral characteristics of different phenomena.
\end{itemize}
If the user wanted to use the division or subtraction of images for determining the changes in forest land use, then the user would have to correct for the haze, sun angle and skylight errors \hyperref[b2]{[4]}. In this approach the results of the land use classification maps extracted from the three images are compared. The classification of land use can be done better and more accurately with the raw (unprocessed) images. Therefore, there was no need for the above corrections for the images used in this study.\par
\textbullet\ Geometric Corrections: The processing and analysis of multi-temporal data can be done only when they are geo-referenced similarly, or in other words, when they are geo-referenced to each other [11]. The images of this study had to be geo-referenced to each other with an accuracy of one pixel. Otherwise, the error coming from different coordinates for similar objects in the two images can be wrongly accepted as a land use change. To prevent such a problem when comparing multi-temporal images, one of the images is geo-referenced using the available topographic maps and the other images are then geo-referenced according to the first one, i.e.\ image-to-image registration is used.\par
In photo/image registration (geo-referencing), the most important task is the proper selection of control points, especially when there is a long time period between the map and the image. In this work, first-order polynomial equations are used for geo-referencing of the images, which remove the errors related to the rotation and scaling of the image. The image may also be transformed to conform to a specific map projection system. Furthermore, if the accurate geographical location of an area on the image needs to be known, ground control points (GCPs) are used to register the image to a precise map (geo-referencing).\par
In this study, the ETM+ image of the year 2001 was first geo-referenced using the information in its header approximately. Then, it was geo-referenced accurately using the available 1:25000 digital maps and the digitized features of the 1:50000 maps of the area. Afterward, the TM image of 1991 was geo-referenced using the already registered TM image. For georeferencing the 2001 image 18 control points were used initially. Every control point with an RMSE or residual error bigger than a pixel size was removed from the calculation and the process of registration was repeated with the rest of the control points. Finally, 10 points with the average error of 01.00 meters remained and were used for registration. For image-to-image registration of the 1991 image 20 control points were initially used. Finally, 6 points were removed and the image was georeferenced using the remained 14 points with the RMSE of 0.92 meters.\par
All images and aerial photographs were rectified to UTM zone 39 N with at least 25 well distributed ground control points. At first, geometric correction was carried out using topographic maps with the scale of 1:25000 to geocode aerial photos. Also, for geometric correction of the 2001 IRS-1C Landsat image, topographic maps with the scale of 1:25000 were used and then this rectified image was employed to register the 2011 LISS-III image. Geometric correction of the Landsat TM image of 1990 was carried out by the use of the IRS-P6 LISS-III image. Finally, a first-order polynomial model was applied and all data were resampled to a 30 m pixel size using the nearest neighbour method. After geometric correction of aerial photos, all photos for each year were mosaicked to prepare one image for land cover mapping.\par
\textbullet\ Image Enhancement: In order to aid visual interpretation, the visual appearance of the objects in the image can be improved by image enhancement techniques such as grey level stretching to improve the contrast and spatial filtering for enhancing the edges \hyperref[b2]{[4]}. The goal of image enhancement is to improve the visual interpretability of an image by increasing the distinction between features. In this study, two false colour composites (FCC) are produced for selecting training samples. Also, image fusion was done to increase the spatial resolution of the LISS-III image. The LISS-III image was fused with the IRS-1C PAN image to generate an image with high spatial resolution \hyperref[b0]{[1]}. Landsat TM enhanced false colour composites RGB (red, green, blue) 4,5,3; 5,3,2; 4,5,7 and 4,3,2 are used for the interpretation and delimitation of the land cover classes [11]. Interpretation and vectorization were done on the screen; Arc Info format was the preferred vector format and can be directly transformed to a land cover map.\par
\textbullet\ Neighborhood Filling: This method has been used to clean and fill the missing cells in the image while doing image classification.\par
\textbullet\ Edge Matching: This step is carried out to maintain the continuity of classes between adjoining mandals/districts/states. A seamless geo data set at district/state level, metadata, and class-wise area statistics are prepared.\par
\textbullet\ Aerial Photos Interpretation: The land cover pattern is interpreted visually on black and white aerial photographs and simultaneously digitized with the Arcmap software. Identifying features in aerial photos is performed based on tone, texture, pattern, size and shape. 
\section[{Conclusion}]{Conclusion}\par
Data mining is data-driven but also, more importantly, human-centered, with the user controlling the selection and integration of data, cleaning and transformation of the data, choice of analysis methods, and the interpretation of results. The abundance of spatial data provides exciting opportunities for new research directions but also demands caution in using these data. The data are often from different sources and collected for different purposes under various conditions, such as measurement uncertainty, biased sampling, varying area unit, and confidentiality constraint. It is important to understand the quality and characteristics of the chosen data. Careful selection, preprocessing, and transformation of the data are needed to ensure meaningful analysis and results. Preprocessing improves performance, but the massive data volumes associated with encoding spatial relationships for all combinations of geographic objects prohibit the storage of all spatial relationships.
 \begin{figure}[htbp]
\noindent\textbf{11113}\includegraphics[]{image-2.png}
\caption{\label{fig_0}Figure 1 . 1 :Figure 1 Figure 1 . 3 :?}\end{figure}
 \begin{figure}[htbp]
\noindent\textbf{31}\includegraphics[]{image-3.png}
\caption{\label{fig_1}Figure 3 . 1 :}\end{figure}
 \begin{figure}[htbp]
\noindent\textbf{}\includegraphics[]{image-4.png}
\caption{\label{fig_2}}\end{figure}
 \begin{figure}[htbp]
\noindent\textbf{}\includegraphics[]{image-5.png}
\caption{\label{fig_3}}\end{figure}
 \begin{figure}[htbp]
\noindent\textbf{}\includegraphics[]{image-6.png}
\caption{\label{fig_6}C}\end{figure}
 \begin{figure}[htbp]
\noindent\textbf{1} \par 
\begin{longtable}{P{0.26062717770034843\textwidth}P{0.23101045296167247\textwidth}P{0.13475609756097562\textwidth}P{0.16585365853658537\textwidth}P{0.05775261324041812\textwidth}}
\tabcellsep \multicolumn{4}{l}{1 : Various Inputs used in the Study}\\
S.No\tabcellsep Type of Map\tabcellsep Resolution/ Scale\tabcellsep Date/Year of Acquisition\tabcellsep Source\\
\tabcellsep \tabcellsep 1:50,000\tabcellsep 57 O/5 -1973-79\tabcellsep SOI\\
1\tabcellsep Topsheet\tabcellsep 1:50,000\tabcellsep 57 J/11 -1973\tabcellsep SOI\\
\tabcellsep \tabcellsep 1:50,000\tabcellsep 57 O/6 -1973\tabcellsep SOI\\
\tabcellsep \tabcellsep 1:50,000\tabcellsep 57 N/9 -1973\tabcellsep SOI\\
2\tabcellsep Landsat -TM\tabcellsep 28.5 mt\tabcellsep 1991\tabcellsep GLCF\\
3\tabcellsep Landsat -ETM+LISS 3\tabcellsep Medium 250,000\tabcellsep 05 th April, 2001\tabcellsep NRSC\\
4\tabcellsep IRS P6. LISS 3 101 -63\tabcellsep Medium 250,000\tabcellsep 6 th Feb, 2010\tabcellsep NRSC\\
5\tabcellsep Mandal Maps\tabcellsep A3 Size\tabcellsep -\tabcellsep Mandal HQ\\
\multicolumn{3}{l}{Review of Literature}\tabcellsep \tabcellsep \\
\tabcellsep \multicolumn{4}{l}{Amos Storkey [2] proposed various data}\\
\multicolumn{5}{l}{preprocessing methods applied on any data before}\\
\multicolumn{5}{l}{applying data mining techniques to ensure the quality of}\\
\multicolumn{5}{l}{decision making. Aleksandar Lazarevic et al}\end{longtable} \par
 
\caption{\label{tab_0}Table 1 .}\end{figure}
 \begin{figure}[htbp]
\noindent\textbf{3} \par 
\begin{longtable}{P{0.6585585585585585\textwidth}P{0.13018018018018016\textwidth}P{0.06126126126126126\textwidth}}
Population Size \& Growth (Difference)\tabcellsep Density = Population / Area\tabcellsep Range Label\\
$< 500$\tabcellsep $< 100$\tabcellsep Low\\
$\geq 500$ and $< 1000$\tabcellsep $\geq 100$ and $< 200$\tabcellsep Medium\\
$\geq 1000$\tabcellsep $> 200$\tabcellsep High\\
\multicolumn{2}{l}{v. Generating New Attributes}\tabcellsep \\
\multicolumn{3}{l}{Users can generate new attributes by applying}\\
\multicolumn{3}{l}{supported to a set of existing attributes. The}\\
\multicolumn{3}{l}{density range, population range etc., are created as new}\\
\multicolumn{2}{l}{attributes for the study.}\tabcellsep \end{longtable} \par
 
\caption{\label{tab_1}Table 3.}\end{figure}
 \begin{figure}[htbp]
\noindent\textbf{} \par 
\begin{longtable}{P{0.85\textwidth}}
\textbullet{} Cloud-free and clear atmosphere during the time of\\
data acquisition;\\
\textbullet{} Availability of imagery for the optimum date or\\
dates;\\
\textbullet{} Spatial resolution fine enough for accurate mapping\\
and coarse enough so image size is manageable;\\
\textbullet{} Band selection (band width, placement, and\\
number of bands) optimized to identify features of\\
interest;\\
\textbullet{} Study area covered on a single image;\\
\textbullet{} Same sensor and sun position when images were\\
acquired; similar atmospheric conditions.\\
\textbullet{} Pragmatically, it is rather difficult to acquire the data\\
with the above characteristics. Instead, the following\\
problems are common in data acquisition process:\\
\textbullet{} Unavailability of data for specific time period;\\
\textbullet{} Persistent cloud coverage throughout the year and\\
for many years;\\
\textbullet{} Cost is too high, especially for commercial satellite\\
data;\\
\textbullet{} Availability of data in usable format (digital or hard\\
copy);\\
\textbullet{} Cost of processing, in producing value-added\\
product;\\
\textbullet{} Lack of expertise, equipment/software for analysis;\\
\textbullet{} Significant improvements have been made in terms\\
of spectral, spatial, temporal and radiometric\\
resolutions. More specifically, improvements have\\
been observed in\\
\textbullet{} Visibility and clarity that includes more detailed\\
image of a smaller piece of land;\\
\textbullet{} Clear definition involving more precisely the specific\\
colours or light responses reflecting off of the field;\\
and\\
\textbullet{} Frequent data acquisition on a regular interval of\\
every other day or every 5--7 days.\\
\textbullet{} The background environment reflected through the\\
remote sensing image obtained in different instant is\\
different because of the influence of various factors\\
in the acquisition process. These factors can be\\
divided into two categories: remote sensing system\\
factors and environmental factors.\\
\textbullet{} The remote sensing system factors are: the impact\\
of temporal, spatial, spectral and radiation\\
resolution.\\
\textbullet{} The environmental factors are: The impact of\\
atmospheric conditions, soil moisture and\\
phenological characteristics.\end{longtable} \par
 
\caption{\label{tab_2}}\end{figure}
 		 		\backmatter  			  				\begin{bibitemlist}{1}
\bibitem[Alvares et al.]{b5}\label{b5} 	 		\textit{A Framework for Trajectory Data Preprocessing for Data Mining},  		 			Luis Otavio Alvares 		,  		 			Gabriel Oliveira 		,  		 			Vania Bogorny 		.  		 \url{http://www.inf.ufsc.br/~vania/artigos/seke2009_6.pdf}  		 	 
\bibitem[Lazarevic et al.]{b1}\label{b1} 	 		‘A Software System for Spatial Data Analysis and Modeling’.  		 			Aleksandar Lazarevic 		,  		 			Tim Fiez 		,  		 			Zoran Obradovic 		.  		 \url{www.ist.temple.edu/~zoran/papers/lazarevic00.pdf}  	 	 		\textit{INEEL University Research Consortium project}  		p. .  	 
\bibitem[Loveland et al. ()]{b7}\label{b7} 	 		\textit{A strategy for estimating the rates of recent United States land-cover changes. Photogrammetric Engineering and Remote Sensing},  		 			T R Loveland 		,  		 			T L Sohl 		,  		 			S V Stehman 		,  		 			A L Gallant 		,  		 			K L Sayler 		,  		 			D E Napton 		.  		2002. 68 p. .  	 
\bibitem[Armston et al. ()]{b0}\label{b0} 	 		‘Geometric Correction of Landsat MSS, TM and ETM+ Imagery for Mapping of Woody Vegetation Cover and Change Detection in Queensland’.  		 			J D Armston 		,  		 			T J Danaher 		,  		 			B Goulevitch 		,  		 			M Byrne 		.  		 \url{www.nrm.qld.gov.au/slats}  	 	 		\textit{Climate Impacts and Natural Resource Systems},  				2002. p. .  	 
\bibitem[Dwivedi (ed.) ()]{b8}\label{b8} 	 		\textit{Mapping Deforestation and Land Cover Conversion at The Rainforest Margin in Central Sulawesi},  		 			Roy P S Dwivedi 		,  		 			R 		.  		11. Stefan Erasmi, Andre Twele, Muhammad Ardiansyah, Adam Malik and Martin Kappas (ed.)  		2011. Indonesia.  		 			National Remote Sensing Centre 		 	 	 (Remote Sensing Applications-Land Use Land Cover Analysis. EAR SeL proceedings 3, 2004. Data Preprocessing in Multi-Temporal Remote Sensing Data for Deforestation Analysis) 
\bibitem[Bruce and Hilbert (2006)]{b2}\label{b2} 	 		‘Preprocessing Methodology for Application to Landsat TM/ETM+ Imagery of the Wet Tropics’.  		 			Caroline M Bruce 		,  		 			David W Hilbert 		.  	 	 		\textit{Cooperative Research Centre for Tropical Rainforest Ecology and Management. Rainforest CRC}  		March 2006.  	 	 (www.rainforest-crc.jcu.edu.au) 
\bibitem[Principles of Remote Sensing-Centre for Remote Imaging, Sensing and Processing]{b3}\label{b3} 	 		 CRISP, \url{www.crisp.nus.edu.sg/~research/tutorial/rsmain.html}  		\textit{Principles of Remote Sensing-Centre for Remote Imaging, Sensing and Processing},  				 	 
\bibitem[Lillesand and Kiefer ()]{b6}\label{b6} 	 		\textit{Remote Sensing and Image Interpretation},  		 			T M Lillesand 		,  		 			R W Kiefer 		.  		1994. New York: John Wiley.  	 
\bibitem[Hutchinson ()]{b4}\label{b4} 	 		‘Techniques for Combining Landsat and Ancillary Data for Digital Classification Improvement’.  		 			C Hutchinson 		.  	 	 		\textit{Photogrammetric Engineering and Remote Sensing}  		1982. 48  (1)  p. .  	 
\end{bibitemlist}
 			 		 	 
\end{document}