% Reference list extracted from a Global Journal of Computer Science and
% Technology article. Keys b0, b1, ... follow the order of the printed
% reference list and must stay stable for existing citations.
% Fields named internal-note are ignored by bibliography styles; they mark
% values that were repaired or could not be confirmed from the extraction.

@article{7B7E61C0C5FCE175B34EEF305BBE8F56,
  author       = {{Ramya R. S.} and Venugopal, K. R.},
  institution  = {University Visvesvaraya College of Engineering, UVCE},
  journal      = {Global Journal of Computer Science and Technology},
  shortjournal = {GJCST},
  volume       = {16},
  number       = {5},
  issn         = {0975-4172, 0975-4350},
  doi          = {10.34257/gjcst},
  publisher    = {Global Journals Organisation},
  address      = {Cambridge, United States},
  internal-note = {Record for the citing article itself. Title and year were not present in the extraction. The raw trailing digits were "165120"; volume 16 and number 5 are read from them, the remaining "120" is unassigned. The doi value is only the journal-level prefix. Verify.},
}

@article{b0,
  author  = {Agrawal, R. and Batra, M.},
  title   = {A Detailed Study on Text Mining Techniques},
  journal = {International Journal of Soft Computing and Engineering (IJSCE)},
  volume  = {2},
  number  = {6},
  year    = {2013},
}

@article{b1,
  author  = {Bhat, V. H. and Rao, P. G. and Abhilash, R. and Shenoy, P. D. and Venugopal, K. R. and Patnaik, L.},
  title   = {A Data Mining Approach for Data Generation and Analysis for Digital Forensic Application},
  journal = {International Journal of Engineering and Technology},
  volume  = {2},
  number  = {3},
  year    = {2010},
}

@inproceedings{b2,
  author    = {Zhang, Y. and Chen, M. and Liu, L.},
  title     = {A Review on Text Mining},
  booktitle = {Proceedings of 6th IEEE International Conference on Software Engineering and Service Science (ICSESS)},
  year      = {2015},
}

@article{b3,
  author  = {Shehata, S. and Karray, F. and Kamel, M. S.},
  title   = {An Efficient Concept-based Mining Model for Enhancing Text Clustering},
  journal = {IEEE Transactions on Knowledge and Data Engineering},
  volume  = {22},
  number  = {10},
  year    = {2010},
}

@inproceedings{b4,
  author    = {Bhat, V. H. and Rao, P. G. and Abhilash, R. and Shenoy, P. D. and Venugopal, K. R. and Patnaik, L.},
  title     = {A Novel Data Generation Approach for Digital Forensic Application in Data Mining},
  booktitle = {Proceedings of Second International Conference on Machine Learning and Computing (ICMLC)},
  year      = {2010},
}

@article{b5,
  author  = {Brown, D. E.},
  title   = {Text Mining the Contributors to Rail Accidents},
  journal = {IEEE Transactions on Intelligent Transportation Systems},
  volume  = {27},
  number  = {5},
  year    = {2015},
}

@book{b6,
  author    = {Venugopal, K. R. and Srinivasa, K. and Patnaik, L. M.},
  title     = {Soft Computing for Data Mining Applications},
  publisher = {Springer},
  year      = {2009},
}

@inproceedings{b7,
  author    = {Verma, V. K. and Ranjan, M. and Mishra, P.},
  title     = {Text Mining and Information Professionals: Role, Issues and Challenges},
  booktitle = {Proceedings of 4th International Symposium on Emerging Trends and Technologies in Libraries and Information Services (ETTLIS)},
  year      = {2015},
}

@inproceedings{b8,
  author    = {Akilan, A.},
  title     = {Text Mining: Challenges and Future Directions},
  booktitle = {Proceedings of Second International Conference on Electronics and Communication Systems (ICECS)},
  year      = {2015},
}

@inproceedings{b9,
  author    = {Sanchez, D. and Martin-Bautista, M. J. and Blanco, I. and Torre, C.},
  title     = {Text Knowledge Mining: An Alternative to Text Data Mining},
  booktitle = {Proceedings of IEEE International Conference on Data Mining Workshops (ICDMW)},
  year      = {2008},
}

@article{b10,
  author  = {Dai, Y. and Kakkonen, T. and Sutinen, E.},
  title   = {{MinEDec}: A Decision-Support Model that Combines Text-Mining Technologies with Two Competitive Intelligence Analysis Methods},
  journal = {International Journal of Computer Information Systems and Industrial Management Applications},
  volume  = {3},
  number  = {10},
  year    = {2011},
}

@article{b11,
  author  = {Hu, Y. and Wan, X.},
  title   = {{PPSGen}: Learning-Based Presentation Slides Generation for Academic Papers},
  journal = {IEEE Transactions on Knowledge and Data Engineering},
  volume  = {27},
  number  = {4},
  year    = {2015},
}

@article{b12,
  author  = {D'Andrea, E. and Ducange, P. and Lazzerini, B. and Marcelloni, F.},
  title   = {Real-Time Detection of Traffic from {Twitter} Stream Analysis},
  journal = {IEEE Transactions on Intelligent Transportation Systems},
  volume  = {16},
  number  = {4},
  year    = {2015},
}

@inproceedings{b13,
  author    = {Li, R. and Lei, K. H. and Khadiwala, R. and Chang, K. C.-C.},
  title     = {{TEDAS}: A {Twitter}-based Event Detection and Analysis System},
  booktitle = {Proceedings of IEEE 28th International Conference on Data Engineering (ICDE)},
  year      = {2012},
  internal-note = {Reassembled from the b13 and b21 fragments, which the extraction split at a page footer; the word "and" in the title is inferred. Verify.},
}

@inproceedings{b14,
  author    = {Bhat, V. H. and Malkani, V. R. and Shenoy, P. D. and Venugopal, K. R. and Patnaik, L.},
  title     = {Classification of Email using {BEAKS}: Behavior and Keyword Stemming},
  booktitle = {Proceedings of IEEE Region 10 Conference TENCON},
  year      = {2011},
}

@inproceedings{b15,
  author    = {Schulz, A. and Ristoski, P. and Paulheim, H.},
  title     = {I See a Car Crash: Real-Time Detection of Small Scale Incidents in Microblogs},
  booktitle = {The Semantic Web: ESWC Satellite Events},
  year      = {2013},
}

@article{b16,
  author  = {Gonzalez, A. and Bergasa, L. M. and Yebes, J. J.},
  title   = {Text Detection and Recognition on Traffic Panels from Street-Level Imagery using Visual Appearance},
  journal = {IEEE Transactions on Intelligent Transportation Systems},
  volume  = {15},
  number  = {1},
  year    = {2014},
}

@article{b17,
  author  = {Muni, D. P. and Pal, N. R. and Das, J.},
  title   = {Genetic Programming for Simultaneous Feature Selection and Classifier Design},
  journal = {IEEE Transactions on Systems, Man, and Cybernetics, Part B (Cybernetics)},
  volume  = {36},
  number  = {1},
  year    = {2006},
}

@article{b18,
  author  = {Aghdam, M. H. and Ghasem-Aghaee, N. and Basiri, M. E.},
  title   = {Text Feature Selection Using Ant Colony Optimization},
  journal = {Expert Systems with Applications},
  volume  = {36},
  number  = {3},
  year    = {2009},
}

@inproceedings{b19,
  author    = {Srinivasa, K. and Singh, A. and Thomas, A. and Venugopal, K. R. and Patnaik, L.},
  title     = {Generic Feature Extraction for Classification using Fuzzy {C-means} Clustering},
  booktitle = {Proceedings of 3rd International Conference on Intelligent Sensing and Information Processing},
  year      = {2005},
}

@article{b20,
  author  = {Gasca, E. and S{\'a}nchez, J. S. and Alonso, R.},
  title   = {Eliminating Redundancy and Irrelevance using a New {MLP}-based Feature Selection Method},
  journal = {Pattern Recognition},
  volume  = {39},
  number  = {2},
  year    = {2006},
}

@inproceedings{b21,
  author    = {Li, R. and Lei, K. H. and Khadiwala, R. and Chang, K. C.-C.},
  title     = {{TEDAS}: A {Twitter}-based Event Detection and Analysis System},
  booktitle = {Proceedings of IEEE 28th International Conference on Data Engineering (ICDE)},
  year      = {2012},
  internal-note = {Same work as b13: the extraction split one reference at a page footer and left the footer text in this title. Key kept so existing citations resolve. Verify.},
}

@inproceedings{b22,
  author    = {Parikh, R. and Karlapalem, K.},
  title     = {{ET}: Events from Tweets},
  booktitle = {Proceedings of the 22nd International Conference on World Wide Web Companion},
  year      = {2013},
}

@article{b23,
  author  = {Sivagaminathan, R. K. and Ramakrishnan, S.},
  title   = {A Hybrid Approach for Feature Subset Selection using Neural Networks and Ant Colony Optimization},
  journal = {Expert Systems with Applications},
  volume  = {33},
  number  = {1},
  year    = {2007},
}

@inproceedings{b24,
  author    = {Cai, D. and Zhang, C. and He, X.},
  title     = {Unsupervised Feature Selection for Multi-cluster Data},
  booktitle = {Proceedings of the 16th ACM SIGKDD International Conference on Knowledge Discovery and Data Mining},
  year      = {2010},
}

@article{b25,
  author  = {Zhao, Z. and He, X. and Cai, D. and Zhang, L. and Ng, W. and Zhuang, Y.},
  title   = {Graph Regularized Feature Selection with Data Reconstruction},
  journal = {IEEE Transactions on Knowledge and Data Engineering},
  volume  = {28},
  number  = {3},
  year    = {2016},
}

@article{b26,
  author  = {Xu, L. and Jiang, C. and Ren, Y. and Chen, H.-H.},
  title   = {Microblog Dimensionality Reduction---A Deep Learning Approach},
  journal = {IEEE Transactions on Knowledge and Data Engineering},
  volume  = {28},
  number  = {7},
  year    = {2016},
}

@article{b27,
  author  = {Wang, D. and Nie, F. and Huang, H.},
  title   = {Feature Selection via Global Redundancy Minimization},
  journal = {IEEE Transactions on Knowledge and Data Engineering},
  volume  = {27},
  number  = {10},
  year    = {2015},
}

@article{b28,
  author  = {Ogura, H. and Amano, H. and Kondo, M.},
  title   = {Feature Selection with a Measure of Deviations from {Poisson} in Text Categorization},
  journal = {Expert Systems with Applications},
  volume  = {36},
  number  = {3},
  year    = {2009},
}

@article{b29,
  author  = {Azam, N. and Yao, J.},
  title   = {Comparison of Term Frequency and Document Frequency based Feature Selection Metrics in Text Categorization},
  journal = {Expert Systems with Applications},
  volume  = {39},
  number  = {5},
  year    = {2012},
}

@article{b30,
  author  = {Yan, S. and Xu, D. and Zhang, B. and Zhang, H.-J. and Yang, Q. and Lin, S.},
  title   = {Graph Embedding and Extensions: A General Framework for Dimensionality Reduction},
  journal = {IEEE Transactions on Pattern Analysis and Machine Intelligence},
  volume  = {29},
  number  = {1},
  year    = {2007},
}

@article{b31,
  author  = {Zhao, Z. and Wang, L. and Liu, H. and Ye, J.},
  title   = {On Similarity Preserving Feature Selection},
  journal = {IEEE Transactions on Knowledge and Data Engineering},
  volume  = {25},
  number  = {3},
  year    = {2013},
}

@article{b32,
  author  = {Zhao, Z. and He, X. and Cai, D. and Zhang, L. and Ng, W. and Zhuang, Y.},
  title   = {Graph Regularized Feature Selection with Data Reconstruction},
  journal = {IEEE Transactions on Knowledge and Data Engineering},
  volume  = {28},
  number  = {3},
  year    = {2016},
  internal-note = {Duplicate of b25; the extraction omitted the third author here, restored to match b25. Key kept so existing citations resolve.},
}

@inproceedings{b33,
  author    = {Tang, J. and Liu, H.},
  title     = {Unsupervised Feature Selection for Linked Social Media Data},
  booktitle = {Proceedings of the 18th ACM SIGKDD International Conference on Knowledge Discovery and Data Mining},
  year      = {2012},
}

@inproceedings{b34,
  author    = {Mousavi, H. and Kerr, D. and Iseli, M. and Zaniolo, C.},
  title     = {Harvesting Domain Specific Ontologies from Text},
  booktitle = {Proceedings of IEEE International Conference on Semantic Computing (ICSC)},
  year      = {2014},
}

@inproceedings{b35,
  author    = {Yang, Y. and Shen, H. T. and Ma, Z. and Huang, Z. and Zhou, X.},
  title     = {{$\ell_{2,1}$}-norm Regularized Discriminative Feature Selection for Unsupervised Learning},
  booktitle = {Proceedings of the International Joint Conference on Artificial Intelligence (IJCAI)},
  volume    = {2},
  year      = {2011},
  internal-note = {Extracted title began with "1-norm"; the dropped prefix was restored. A stray "2" after the year is read as the volume. Verify.},
}

@article{b36,
  author  = {Cai, D. and He, X. and Han, J. and Huang, T. S.},
  title   = {Graph Regularized Nonnegative Matrix Factorization for Data Representation},
  journal = {IEEE Transactions on Pattern Analysis and Machine Intelligence},
  volume  = {33},
  number  = {8},
  year    = {2011},
}

@inproceedings{b37,
  author    = {Sejal, D. and Shailesh, K. and Tejaswi, V. and Anvekar, D. and Venugopal, K. R. and Iyengar, S. and Patnaik, L.},
  title     = {{QRGQR}: Query Relevance Graph for Query Recommendation},
  booktitle = {Proceedings of IEEE Region 10 Symposium (TENSYMP)},
  year      = {2015},
}

@article{b38,
  author  = {Fan, W. and Bouguila, N. and Ziou, D.},
  title   = {Unsupervised Hybrid Feature Extraction Selection for High-Dimensional {Non-Gaussian} Data Clustering with Variational Inference},
  journal = {IEEE Transactions on Knowledge and Data Engineering},
  volume  = {25},
  number  = {7},
  year    = {2013},
}

@article{b39,
  author  = {Gupta, V. and Lehal, G. S.},
  title   = {A Survey of Text Summarization Extractive Techniques},
  journal = {Journal of Emerging Technologies in Web Intelligence},
  volume  = {2},
  number  = {3},
  year    = {2010},
  internal-note = {Second author was extracted as the bare initials "GS"; surname restored from the published record. Verify.},
}

@article{b40,
  author  = {Negi, P. S. and Rauthan, M. and Dhami, H.},
  title   = {Text Summarization for Information Retrieval using Pattern Recognition Techniques},
  journal = {International Journal of Computer Applications},
  volume  = {21},
  number  = {10},
  year    = {2011},
}

@article{b41,
  author  = {Debole, F. and Sebastiani, F.},
  title   = {An Analysis of the Relative Hardness of {Reuters-21578} Subsets},
  journal = {Journal of the American Society for Information Science and Technology},
  volume  = {56},
  number  = {6},
  year    = {2005},
}
% Reference entries b42 through b135 of a machine-extracted reference list.
% Keys follow the order of the printed references and must stay stable.
% Fields named internal-note are ignored by bibliography styles; they mark
% values that were repaired or could not be confirmed from the extraction.

@inproceedings{b42,
  author    = {Xie, F. and Wu, X. and Hu, X.},
  title     = {Keyphrase Extraction based on Semantic Relatedness},
  booktitle = {Proceedings of 9th IEEE International Conference on Cognitive Informatics (ICCI)},
  year      = {2010},
}

@inproceedings{b43,
  author    = {Li, Y. and Algarni, A. and Zhong, N.},
  title     = {Mining Positive and Negative Patterns for Relevance Feature Discovery},
  booktitle = {Proceedings of the 16th ACM SIGKDD International Conference on Knowledge Discovery and Data Mining},
  year      = {2010},
}

@article{b44,
  author  = {Zhong, N. and Li, Y. and Wu, S.-T.},
  title   = {Effective Pattern Discovery for Text Mining},
  journal = {IEEE Transactions on Knowledge and Data Engineering},
  volume  = {24},
  number  = {1},
  year    = {2012},
}

@article{b45,
  author  = {Chen, Y.-C. and Peng, W.-C. and Lee, S.-Y.},
  title   = {Mining Temporal Patterns in Time Interval-Based Data},
  journal = {IEEE Transactions on Knowledge and Data Engineering},
  volume  = {27},
  number  = {12},
  year    = {2015},
}

@article{b46,
  author  = {Bartoli, A. and Lorenzo, A. and Medvet, E. and Tarlao, F.},
  title   = {Inference of Regular Expressions for Text Extraction from Examples},
  journal = {IEEE Transactions on Knowledge and Data Engineering},
  volume  = {28},
  number  = {5},
  year    = {2016},
}

@article{b47,
  author  = {Li, Y. and Algarni, A. and Albathan, M. and Shen, Y. and Bijaksana, M. A.},
  title   = {Relevance Feature Discovery for Text Mining},
  journal = {IEEE Transactions on Knowledge and Data Engineering},
  volume  = {27},
  number  = {6},
  year    = {2015},
}

@article{b48,
  author  = {Song, Q. and Ni, J. and Wang, G.},
  title   = {A Fast Clustering-Based Feature Subset Selection Algorithm for High-Dimensional Data},
  journal = {IEEE Transactions on Knowledge and Data Engineering},
  volume  = {25},
  number  = {1},
  year    = {2013},
}

@article{b49,
  author  = {Nguyen, T.-S. and Lauw, H. W. and Tsaparas, P.},
  title   = {Review Selection Using Micro-Reviews},
  journal = {IEEE Transactions on Knowledge and Data Engineering},
  volume  = {27},
  number  = {4},
  year    = {2015},
}

@inproceedings{b50,
  author    = {Kadhim, A. I. and Cheah, Y. and Ahamed, N. H. and Salman, L. A.},
  title     = {Feature Extraction for Co-occurrence-based Cosine Similarity Score of Text Documents},
  booktitle = {Proceedings of IEEE Student Conference on Research and Development (SCOReD)},
  year      = {2014},
}

@inproceedings{b51,
  author    = {Fradkin, D. and Madigan, D.},
  title     = {Experiments with Random Projections for Machine Learning},
  booktitle = {Proceedings of the Ninth ACM SIGKDD International Conference on Knowledge Discovery and Data Mining},
  year      = {2003},
}

@inproceedings{b52,
  author    = {Joshi, S. and Shenoy, D. and Rashmi, P. and Venugopal, K. R. and Patnaik, L.},
  title     = {Classification of {Alzheimer's} Disease and {Parkinson's} Disease by using Machine Learning and Neural Network Methods},
  booktitle = {Proceedings of Second International Conference on Machine Learning and Computing (ICMLC)},
  year      = {2010},
}

@inproceedings{b53,
  author    = {Ahonen, H. and Heinonen, O. and Klemettinen, M. and Verkamo, A. I.},
  title     = {Applying Data Mining Techniques for Descriptive Phrase Extraction in Digital Document Collections},
  booktitle = {Proceedings of IEEE International Forum on Research and Technology Advances in Digital Libraries},
  year      = {1998},
}

@inproceedings{b54,
  author    = {Yan, X. and Han, J. and Afshar, R.},
  title     = {{CloSpan}: Mining Closed Sequential Patterns in Large Datasets},
  booktitle = {SDM},
  year      = {2003},
}

@inproceedings{b55,
  author    = {Gomariz, A. and Campos, M. and Marin, R. and Goethals, B.},
  title     = {{ClaSP}: An Efficient Algorithm for Mining Frequent Closed Sequences},
  booktitle = {Advances in Knowledge Discovery and Data Mining},
  year      = {2013},
}

@inproceedings{b56,
  author    = {Pei, J. and Han, J. and Mao, R.},
  title     = {{CLOSET}: An Efficient Algorithm for Mining Frequent Closed Itemsets},
  booktitle = {ACM SIGMOD Workshop on Research Issues in Data Mining and Knowledge Discovery},
  volume    = {4},
  number    = {2},
  year      = {2000},
}

@inproceedings{b57,
  author    = {Han, J. and Pei, J. and Mortazavi-Asl, B. and Chen, Q. and Dayal, U. and Hsu, M.-C.},
  title     = {{FreeSpan}: Frequent Pattern-Projected Sequential Pattern Mining},
  booktitle = {Proceedings of the Sixth ACM SIGKDD International Conference on Knowledge Discovery and Data Mining},
  year      = {2000},
}

@inproceedings{b58,
  author    = {Pei, J. and Han, J. and Mortazavi-Asl, B. and Pinto, H. and Chen, Q. and Dayal, U. and Hsu, M.-C.},
  title     = {{PrefixSpan}: Mining Sequential Patterns Efficiently by Prefix-Projected Pattern Growth},
  booktitle = {ICCN},
  year      = {2001},
}

@book{b59,
  author    = {Venugopal, K. R. and Buyya, R.},
  title     = {Mastering {C++}},
  publisher = {Tata McGraw-Hill Education},
  year      = {2013},
}

@inproceedings{b60,
  author    = {Garofalakis, M. N. and Rastogi, R. and Shim, K.},
  title     = {{SPIRIT}: Sequential Pattern Mining with Regular Expression Constraints},
  booktitle = {VLDB},
  volume    = {99},
  year      = {1999},
}

@article{b61,
  author  = {Zhong, N. and Li, Y. and Wu, S.-T.},
  title   = {Effective Pattern Discovery for Text Mining},
  journal = {IEEE Transactions on Knowledge and Data Engineering},
  volume  = {24},
  number  = {1},
  year    = {2012},
  internal-note = {Duplicate of b44; key kept so existing citations resolve.},
}

@inproceedings{b62,
  author    = {Inje, A. and Patil, U.},
  title     = {Operational Pattern Revealing Technique in Text Mining},
  booktitle = {Proceedings of IEEE Students' Conference on Electrical, Electronics and Computer Science (SCEECS)},
  year      = {2014},
}

@article{b63,
  author  = {Bayardo, Jr., R. J.},
  title   = {Efficiently Mining Long Patterns from Databases},
  journal = {ACM SIGMOD Record},
  volume  = {27},
  number  = {2},
  year    = {1998},
}

@inproceedings{b64,
  author    = {Yang, Y. and Pedersen, J. O.},
  title     = {A Comparative Study on Feature Selection in Text Categorization},
  booktitle = {ICML},
  volume    = {97},
  year      = {1997},
}

@article{b65,
  author  = {Shenoy, P. D. and Srinivasa, K. and Venugopal, K. R. and Patnaik, L. M.},
  title   = {Dynamic Association Rule Mining using Genetic Algorithms},
  journal = {Intelligent Data Analysis},
  volume  = {9},
  number  = {5},
  year    = {2005},
  internal-note = {Last two authors were extracted as "LMVenugopal" and "Patnaik" (initials shifted); restored to the forms used elsewhere in this file. Verify.},
}

@inproceedings{b66,
  author    = {Seno, M. and Karypis, G.},
  title     = {{SLPMiner}: An Algorithm for Finding Frequent Sequential Patterns using Length-Decreasing Support Constraint},
  booktitle = {Proceedings of IEEE International Conference on Data Mining},
  year      = {2002},
}

@article{b67,
  author  = {Mabroukeh, N. R. and Ezeife, C. I.},
  title   = {A Taxonomy of Sequential Pattern Mining Algorithms},
  journal = {ACM Computing Surveys (CSUR)},
  volume  = {43},
  number  = {1},
  year    = {2010},
}

@article{b68,
  author  = {Zaki, M. J.},
  title   = {{SPADE}: An Efficient Algorithm for Mining Frequent Sequences},
  journal = {Machine Learning},
  volume  = {42},
  number  = {1--2},
  year    = {2001},
}

@article{b69,
  author  = {Han, J. and Pei, J. and Yin, Y. and Mao, R.},
  title   = {Mining Frequent Patterns without Candidate Generation: A Frequent-Pattern Tree Approach},
  journal = {Data Mining and Knowledge Discovery},
  volume  = {8},
  number  = {1},
  year    = {2004},
}

@article{b70,
  author  = {Raju, V. P. and Varma, G. S.},
  title   = {Mining Closed Sequential Patterns in Large Sequence Databases},
  journal = {International Journal of Database Management Systems},
  volume  = {7},
  number  = {1},
  year    = {2015},
}

@article{b71,
  author  = {Zhang, J. and Zhao, X. and Zhang, S. and Yin, S. and Qin, X.},
  title   = {Interrelation Analysis of Celestial Spectra Data using Constrained Frequent Pattern Trees},
  journal = {Knowledge-Based Systems},
  volume  = {41},
  number  = {4},
  year    = {2013},
  internal-note = {Extraction listed two further authors, "ISenior" and "Member"; these look like a membership-grade annotation rather than people and were dropped. Verify.},
}

@article{b72,
  author  = {Li, F. and Ooi, B. C. and {\"O}zsu, M. T. and Wu, S.},
  title   = {Distributed Data Management using {MapReduce}},
  journal = {ACM Computing Surveys (CSUR)},
  volume  = {46},
  number  = {3},
  year    = {2014},
  internal-note = {Third author was extracted as the bare initials "MT"; surname restored from the published record. Verify.},
}

@article{b73,
  author  = {Tiwari, N. and Sarkar, S. and Bellur, U. and Indrawan, M.},
  title   = {Classification Framework of {MapReduce} Scheduling Algorithms},
  journal = {ACM Computing Surveys (CSUR)},
  volume  = {47},
  number  = {3},
  year    = {2015},
}

@article{b74,
  author  = {Xun, Y. and Zhang, J. and Qin, X.},
  title   = {{FiDoop}: Parallel Mining of Frequent Itemsets Using {MapReduce}},
  journal = {IEEE Transactions on Systems, Man, and Cybernetics: Systems},
  volume  = {46},
  number  = {3},
  year    = {2016},
}

@article{b75,
  author  = {Sakr, S. and Liu, A. and Fayoumi, A. G.},
  title   = {The Family of {MapReduce} and Large-Scale Data Processing Systems},
  journal = {ACM Computing Surveys (CSUR)},
  volume  = {46},
  number  = {1},
  year    = {2013},
}

@article{b76,
  author  = {Wang, L. and Feng, L. and Zhang, J. and Liao, P.},
  title   = {An Efficient Algorithm of Frequent Itemsets Mining based on {MapReduce}},
  journal = {Journal of Information and Computational Science},
  volume  = {11},
  number  = {8},
  year    = {2014},
}

@article{b77,
  author  = {Ramakrishnudu, T. and Subramanyam, R.},
  title   = {Mining Interesting Infrequent Itemsets from Very Large Data based on {MapReduce} Framework},
  journal = {International Journal of Intelligent Systems and Applications},
  volume  = {7},
  number  = {7},
  year    = {2015},
}

@article{b78,
  author  = {Ozkural, E. and Ucar, B. and Aykanat, C.},
  title   = {Parallel Frequent Item Set Mining with Selective Item Replication},
  journal = {IEEE Transactions on Parallel and Distributed Systems},
  volume  = {22},
  number  = {10},
  year    = {2011},
}

@inproceedings{b79,
  author    = {Xu, Z. and Akella, R.},
  title     = {Active Relevance Feedback for Difficult Queries},
  booktitle = {Proceedings of the 17th ACM Conference on Information and Knowledge Management},
  year      = {2008},
}

@article{b80,
  author  = {Desai, S. and Chandrasheker, V. and Mathapati, V. and {KR VRajuk} and Iyengar, S. S. and Patnaik, L. M.},
  title   = {User Feedback Session with Clicked and Unclicked Documents for Related Search Recommendation},
  journal = {IADIS-International Journal on Computer Science and Information Systems},
  volume  = {11},
  number  = {1},
  year    = {2016},
  internal-note = {Fourth author "KR VRajuk" is kept verbatim from the extraction because it could not be resolved to a name. Verify.},
}

@inproceedings{b81,
  author    = {Cao, G. and Nie, J.-Y. and Gao, J. and Robertson, S.},
  title     = {Selecting Good Expansion Terms for Pseudo-Relevance Feedback},
  booktitle = {Proceedings of the 31st Annual International ACM SIGIR Conference on Research and Development in Information Retrieval},
  year      = {2008},
}

@article{b82,
  author  = {Paik, J. H. and Pal, D. and Parui, S. K.},
  title   = {Incremental Blind Feedback: An Effective Approach to Automatic Query Expansion},
  journal = {ACM Transactions on Asian Language Information Processing (TALIP)},
  volume  = {13},
  number  = {3},
  year    = {2014},
}

@inproceedings{b83,
  author    = {Algarni, A. and Li, Y. and Xu, Y.},
  title     = {Selected New Training Documents to Update User Profile},
  booktitle = {Proceedings of the 19th ACM International Conference on Information and Knowledge Management},
  year      = {2010},
}

@article{b84,
  author  = {Niharika, S. and Latha, V. S. and Lavanya, D.},
  title   = {A Survey on Text Categorization},
  journal = {International Journal of Computer Trends and Technology},
  volume  = {3},
  number  = {1},
  year    = {2012},
}

@article{b85,
  author  = {Sebastiani, F.},
  title   = {Machine Learning in Automated Text Categorization},
  journal = {ACM Computing Surveys (CSUR)},
  volume  = {34},
  number  = {1},
  year    = {2002},
}

@article{b86,
  author  = {Irfan, R. and King, C. K. and Grages, D. and Ewen, S. and Khan, S. U. and Madani, S. A. and Kolodziej, J. and Wang, L. and Chen, D. and Rayes, A.},
  title   = {A Survey on Text Mining in Social Networks},
  journal = {The Knowledge Engineering Review},
  volume  = {30},
  number  = {2},
  year    = {2015},
}

@inproceedings{b87,
  author    = {Vu, H. N. and Tran, T. A. and Na, I. S. and Kim, S. H.},
  title     = {Automatic Extraction of Text Regions from Document Images by Multilevel Thresholding and k-means Clustering},
  booktitle = {Proceedings of IEEE/ACIS 14th International Conference on Computer and Information Science (ICIS)},
  year      = {2015},
}

@article{b88,
  author  = {Dou, Z. and Jiang, Z. and Hu, S. and Wen, J.-R. and Song, R.},
  title   = {Automatically Mining Facets for Queries from Their Search Results},
  journal = {IEEE Transactions on Knowledge and Data Engineering},
  volume  = {28},
  number  = {2},
  year    = {2016},
}

@inproceedings{b89,
  author    = {Sejal, A. and Shailesh, K. and Tejaswi, V. and Anvekar, D. and Venugopal, K. R. and Iyengar, S. and Patnaik, L.},
  title     = {Query Click and Text Similarity Graph for Query Suggestions},
  booktitle = {International Workshop on Machine Learning and Data Mining in Pattern Recognition},
  year      = {2015},
}

@article{b90,
  author  = {Shi, X. and Yang, C. C.},
  title   = {Mining Related Queries from Web Search Engine Query Logs using an Improved Association Rule Mining Model},
  journal = {Journal of the American Society for Information Science and Technology},
  volume  = {58},
  number  = {12},
  year    = {2007},
}

@inproceedings{b91,
  author    = {Diao, M. and Mukherjea, S. and Rajput, N. and Srivastava, K.},
  title     = {Faceted Search and Browsing of Audio Content on Spoken {Web}},
  booktitle = {Proceedings of the 19th ACM International Conference on Information and Knowledge Management},
  year      = {2010},
}

@article{b92,
  author  = {Efstathiades, C. and Efentakis, A. and Pfoser, D.},
  title   = {Efficient Processing of Relevant Nearest-Neighbor Queries},
  journal = {ACM Transactions on Spatial Algorithms and Systems (TSAS)},
  volume  = {2},
  number  = {3},
  year    = {2016},
}

@article{b93,
  author  = {Zhang, C. and Zhang, Y. and Zhang, W. and Lin, X.},
  title   = {Inverted Linear Quadtree: Efficient Top k Spatial Keyword Search},
  journal = {IEEE Transactions on Knowledge and Data Engineering},
  volume  = {28},
  number  = {7},
  year    = {2016},
}

@article{b94,
  author  = {Pripu{\v{z}}i{\'c}, K. and Zarko, I. P. and Aberer, K.},
  title   = {Time- and Space-Efficient Sliding Window Top-k Query Processing},
  journal = {ACM Transactions on Database Systems (TODS)},
  volume  = {40},
  number  = {1},
  year    = {2015},
}

@article{b95,
  author  = {Hon, W.-K. and Shah, R. and Thankachan, S. V. and Vitter, J. S.},
  title   = {Space-Efficient Frameworks for Top-k String Retrieval},
  journal = {Journal of the ACM (JACM)},
  volume  = {61},
  number  = {2},
  year    = {2014},
}

@inproceedings{b96,
  author    = {Kong, W. and Allan, J.},
  title     = {Extending Faceted Search to the General {Web}},
  booktitle = {Proceedings of the 23rd ACM International Conference on Information and Knowledge Management},
  year      = {2014},
}

@inproceedings{b97,
  author    = {Bron, M. and Balog, K. and de Rijke, M.},
  title     = {Ranking Related Entities: Components and Analyses},
  booktitle = {Proceedings of the 19th ACM International Conference on Information and Knowledge Management},
  year      = {2010},
}

@article{b98,
  author  = {Navarro, G.},
  title   = {Spaces, Trees, and Colors: The Algorithmic Landscape of Document Retrieval on Sequences},
  journal = {ACM Computing Surveys (CSUR)},
  volume  = {46},
  number  = {4},
  year    = {2014},
}

@article{b99,
  author  = {Liu, S. and Chen, Y. and Wei, H. and Yang, J. and Zhou, K. and Drucker, S. M.},
  title   = {Exploring Topical Lead-Lag Across Corpora},
  journal = {IEEE Transactions on Knowledge and Data Engineering},
  volume  = {27},
  number  = {1},
  year    = {2015},
}

@article{b100,
  author  = {Jiang, D. and Tong, Y. and Song, Y.},
  title   = {Cross-Lingual Topic Discovery from Multilingual Search Engine Query Log},
  journal = {ACM Transactions on Information Systems (TOIS)},
  volume  = {35},
  number  = {2},
  year    = {2016},
}

@article{b101,
  author  = {Cafarella, M. J. and Halevy, A. and Wang, D. Z. and Wu, E. and Zhang, Y.},
  title   = {{WebTables}: Exploring the Power of Tables on the {Web}},
  journal = {Proceedings of the VLDB Endowment},
  volume  = {1},
  year    = {2008},
  internal-note = {Venue was extracted as "Proceedings of the VLDB Data to find Endowment"; the interleaved words were removed. A stray "1" after the year is read as the volume. Verify.},
}

@inproceedings{b102,
  author    = {Pound, J. and Paparizos, S. and Tsaparas, P.},
  title     = {Facet Discovery for Structured Web Search: A Query-Log Mining Approach},
  booktitle = {Proceedings of the ACM SIGMOD International Conference on Management of Data},
  year      = {2011},
}

@article{b103,
  author  = {Altingovde, I. S. and Ozcan, R. and Ulusoy, {\"O}.},
  title   = {Static Index Pruning in Web Search Engines: Combining Term and Document Popularities with Query Views},
  journal = {ACM Transactions on Information Systems (TOIS)},
  volume  = {30},
  number  = {1},
  year    = {2012},
}

@article{b104,
  author  = {Koutris, P. and Upadhyaya, P. and Balazinska, M. and Howe, B. and Suciu, D.},
  title   = {Query-Based Data Pricing},
  journal = {Journal of the ACM (JACM)},
  volume  = {62},
  number  = {5},
  year    = {2015},
}

@article{b105,
  author  = {Lucchese, C. and Orlando, S. and Perego, R. and Silvestri, F. and Tolomei, G.},
  title   = {Discovering Tasks from Search Engine Query Logs},
  journal = {ACM Transactions on Information Systems (TOIS)},
  volume  = {31},
  number  = {3},
  year    = {2013},
}

@article{b106,
  author  = {Liu, Z. and Chen, Y.},
  title   = {Differentiating Search Results on Structured Data},
  journal = {ACM Transactions on Database Systems (TODS)},
  volume  = {37},
  number  = {1},
  year    = {2012},
}

@article{b107,
  author  = {Thai, V. and Rouille, P.-Y. and Handschuh, S.},
  title   = {Visual Abstraction and Ordering in Faceted Browsing of Text Collections},
  journal = {ACM Transactions on Intelligent Systems and Technology (TIST)},
  volume  = {3},
  number  = {2},
  year    = {2012},
}

@article{b108,
  author  = {Catallo, I. and Ciceri, E. and Fraternali, P. and Martinenghi, D. and Tagliasacchi, M.},
  title   = {Top-k Diversity Queries Over Bounded Regions},
  journal = {ACM Transactions on Database Systems (TODS)},
  volume  = {38},
  number  = {2},
  year    = {2013},
  internal-note = {Extraction shifted every initial one author to the left ("ECatallo", "PCiceri", "DFraternali", "MMartinenghi", bare "Tagliasacchi"); initials realigned from the published record. Verify.},
}

@article{b109,
  author  = {Bast, H. and Celikik, M.},
  title   = {Efficient Fuzzy Search in Large Text Collections},
  journal = {ACM Transactions on Information Systems (TOIS)},
  volume  = {31},
  number  = {2},
  year    = {2013},
}

@article{b110,
  author  = {Termehchy, A. and Winslett, M.},
  title   = {Using Structural Information in {XML} Keyword Search Effectively},
  journal = {ACM Transactions on Database Systems (TODS)},
  volume  = {36},
  number  = {1},
  year    = {2011},
}

@article{b111,
  author  = {Colini-Baldeschi, R. and Leonardi, S. and Henzinger, M. and Starnberger, M.},
  title   = {On Multiple Keyword Sponsored Search Auctions with Budgets},
  journal = {ACM Transactions on Economics and Computation},
  volume  = {4},
  number  = {1},
  year    = {2016},
}

@article{b112,
  author  = {Arguello, J. and Capra, R.},
  title   = {The Effects of Aggregated Search Coherence on Search Behavior},
  journal = {ACM Transactions on Information Systems (TOIS)},
  volume  = {35},
  number  = {1},
  year    = {2016},
  internal-note = {Extracted as "RArguello" and bare "Capra" (initials shifted); realigned from the published record. Verify.},
}

@article{b113,
  author  = {Wu, D. and Yiu, M. L. and Jensen, C. S.},
  title   = {Moving Spatial Keyword Queries: Formulation, Methods, and Analysis},
  journal = {ACM Transactions on Database Systems (TODS)},
  volume  = {38},
  number  = {1},
  year    = {2013},
}

@book{b114,
  author    = {Lu, Y. and Lu, J. and Cong, G. and Wu, W. and Shahabi, C.},
  title     = {Efficient Algorithms and Cost Models for Reverse Spatial-Keyword K Nearest Neighbor Search},
  publisher = {ACM},
  internal-note = {No year or venue was present in the extraction; entry type kept as extracted. Verify.},
}

@article{b115,
  author  = {Cao, X. and Cong, G. and Guo, T. and Jensen, C. S. and Ooi, B. C.},
  title   = {Efficient Processing of Spatial Group Keyword Queries},
  journal = {ACM Transactions on Database Systems (TODS)},
  volume  = {40},
  number  = {2},
  year    = {2015},
}

@article{b116,
  author  = {Guan, Z. and Yang, S. and Sun, H. and Srivatsa, M. and Yan, X.},
  title   = {Fine-Grained Knowledge Sharing in Collaborative Environments},
  journal = {IEEE Transactions on Knowledge and Data Engineering},
  volume  = {27},
  number  = {8},
  year    = {2015},
}

@inproceedings{b117,
  author    = {Wang, H. and Song, Y. and Chang, M.-W. and He, X. and White, R. W. and Chu, W.},
  title     = {Learning to Extract Cross-Session Search Tasks},
  booktitle = {Proceedings of the 22nd International Conference on World Wide Web},
  year      = {2013},
}

@inproceedings{b118,
  author    = {Kotov, A. and Bennett, P. N. and White, R. W. and Dumais, S. T. and Teevan, J.},
  title     = {Modeling and Analysis of Cross-Session Search Tasks},
  booktitle = {Proceedings of the 34th International ACM SIGIR Conference on Research and Development in Information Retrieval},
  year      = {2011},
}

@article{b119,
  author  = {Papenbrock, T. and Heise, A. and Naumann, F.},
  title   = {Progressive Duplicate Detection},
  journal = {IEEE Transactions on Knowledge and Data Engineering},
  volume  = {27},
  number  = {5},
  year    = {2015},
}

@article{b120,
  author  = {Bano, H. and Azam, F.},
  title   = {Innovative Windows for Duplicate Detection},
  journal = {International Journal of Software Engineering and Its Applications},
  volume  = {9},
  number  = {1},
  year    = {2015},
}

@article{b121,
  author  = {Bronselaer, A. and Van Britsom, D. and De Tr{\'e}, G.},
  title   = {Propagation of Data Fusion},
  journal = {IEEE Transactions on Knowledge and Data Engineering},
  volume  = {27},
  number  = {5},
  year    = {2015},
}

@article{b122,
  author  = {Papadakis, G. and Ioannou, E. and Palpanas, T. and Nieder{\'e}e, C. and Nejdl, W.},
  title   = {A Blocking Framework for Entity Resolution in Highly Heterogeneous Information Spaces},
  journal = {ACM Transactions on Database Systems (TODS)},
  volume  = {39},
  year    = {2014},
  internal-note = {Extraction merged fragments: the year was "2014. 2013", the venue read "Highly Heterogeneous C Transactions on Database Systems (TODS)", and "Information Spaces" sat in a note. The title was reassembled from those pieces, and the venue name was aligned with the other TODS entries. Venue, volume and year may belong to a different reference. Verify.},
}

@inproceedings{b123,
  author    = {Papadakis, G. and Nejdl, W.},
  title     = {Efficient Entity Resolution Methods for Heterogeneous Information Spaces},
  booktitle = {Proceedings of IEEE 27th International Conference on Data Engineering Workshops (ICDEW)},
  year      = {2011},
}

@article{b124,
  author  = {Hassanzadeh, O. and Chiang, F. and Lee, H. C. and Miller, R. J.},
  title   = {Framework for Evaluating Clustering Algorithms in Duplicate Detection},
  journal = {Proceedings of the VLDB Endowment},
  volume  = {2},
  year    = {2009},
}

@article{b125,
  author  = {Whang, S. E. and Marmaros, D. and Garcia-Molina, H.},
  title   = {Pay-as-You-Go Entity Resolution},
  journal = {IEEE Transactions on Knowledge and Data Engineering},
  volume  = {25},
  number  = {5},
  year    = {2013},
}

@article{b126,
  author  = {Abraham, A. A. and Kanmani, S. D. and Tamilselvi, J. J. and Gifta, C. B.},
  title   = {A Survey on Various Methods used for Detecting Duplicates in},
  journal = {International Journal of Computer Applications},
  volume  = {15},
  number  = {4},
  year    = {2011},
  note    = {Handling Duplicate Data in Data Warehouse for Data Mining},
  internal-note = {Looks like two references merged by the extraction: the title is truncated (a stray "127" was removed from its end), a ";" preceded the third author, and the note text reads like a second title. Verify and split if needed.},
}

@article{b127,
  author  = {Elmagarmid, A. K. and Ipeirotis, P. G. and Verykios, V. S.},
  title   = {Duplicate Record Detection: A Survey},
  journal = {IEEE Transactions on Knowledge and Data Engineering},
  volume  = {19},
  number  = {1},
  year    = {2007},
}

@article{b128,
  author  = {Christen, P.},
  title   = {A Survey of Indexing Techniques for Scalable Record Linkage and Deduplication},
  journal = {IEEE Transactions on Knowledge and Data Engineering},
  volume  = {24},
  number  = {9},
  year    = {2012},
}

@article{b129,
  author  = {de Vries, T. and Ke, H. and Chawla, S. and Christen, P.},
  title   = {Robust Record Linkage Blocking using Suffix Arrays and {Bloom} Filters},
  journal = {ACM Transactions on Knowledge Discovery from Data (TKDD)},
  volume  = {5},
  number  = {2},
  year    = {2011},
}

@article{b130,
  author  = {Hassanzadeh, O. and Miller, R. J.},
  title   = {Creating Probabilistic Databases from Duplicated Data},
  journal = {The VLDB Journal---The International Journal on Very Large Data Bases},
  volume  = {18},
  year    = {2009},
}

@inproceedings{b131,
  author    = {Bronselaer, A. and De Tr{\'e}, G.},
  title     = {Aspects of Object Merging},
  booktitle = {Annual Meeting of the North American Fuzzy Information Processing Society (NAFIPS)},
  year      = {2010},
}

@inproceedings{b132,
  author    = {Draisbach, U. and Naumann, F. and Szott, S. and Wonneberg, O.},
  title     = {Adaptive Windows for Duplicate Detection},
  booktitle = {Proceedings of IEEE 28th International Conference on Data Engineering (ICDE)},
  year      = {2012},
}

@article{b133,
  author  = {Naumann, F. and Bilke, A. and Bleiholder, J. and Weis, M.},
  title   = {Data Fusion in Three Steps: Resolving Schema, Tuple, and Value Inconsistencies},
  journal = {International Journal of Engineering Research and Technology},
  volume  = {3},
  number  = {1},
  year    = {2014},
  note    = {Engineering and Management},
  internal-note = {Year was extracted as "2014. 2006"; the first value is kept because it sits with the venue data. Venue, volume, number and note may belong to a different reference. Verify.},
}

@article{b134,
  author  = {Bleiholder, J. and Naumann, F.},
  title   = {Data Fusion},
  journal = {ACM Computing Surveys (CSUR)},
  volume  = {41},
  number  = {1},
  year    = {2009},
}

@article{b135,
  author  = {Meng, L. and Tan, A.-H. and Xu, D.},
  title   = {Semi-Supervised Heterogeneous Fusion for Multimedia Data Co-Clustering},
  journal = {IEEE Transactions on Knowledge and Data Engineering},
  volume  = {26},
  number  = {9},
  year    = {2014},
}