NSF III: Small: On the Conceptual Evaluation and Optimization of Queries in Spatiotemporal Data Systems

 

Walid G. Aref

Principal Investigator

Department of Computer Science
Purdue University

Contact Information

Walid G. Aref

Department of Computer Science

Purdue University

305 N. University Street

West Lafayette, Indiana 47907

Phone: (765) 494-1997
Fax: (765) 494-0739
Email: aref@cs.purdue.edu
URL: http://www.cs.purdue.edu/faculty/aref.html

Project Award Information

Project Web Page:
http://www.cs.purdue.edu/homes/aref/dbsystems2014-3.htm

Project Focus:

The widespread use of smartphones, social networks, and location devices has given rise to a wide spectrum of location-based applications and services. Along with the advancement and ubiquity of these applications and services, users' queries are steadily growing in complexity and sophistication. Current location-based query systems offer shallow query interfaces that do not match users' expectations. This project identifies and addresses the challenges in correctly expressing and efficiently executing complex location-based queries. A user's query can be arbitrarily complex, combining multiple location-based, relational, and textual operations, e.g., location-based selections, spatial joins, relational selections, relational joins, and relational group-by's. Current location-based query systems support only one location-based operator at a time, e.g., range queries or nearby queries (k-Nearest-Neighbors, or kNN, for short). Our focus is to develop a query system, termed the multi-predicate location-based query processing system, that supports any combination of location-based, relational, and textual operations.

 

Progress:

In the initial phase of this project, we identified location-based application scenarios and their associated queries that current state-of-the-art location-based query systems cannot handle. We isolated and classified the reasons these queries are hard to handle. The first class of such queries involves two k-nearest-neighbor operators; we term this class the 2-kNN queries. Many application scenarios call for this type of query, and we highlight several examples in our [VLDB2012] paper. Several challenges arise when handling 2-kNN queries, including:

(1) The result of a 2-kNN query differs depending on the order in which the two kNN operations are executed (see the sketch after this list).

(2) How to determine what the correct answer for a 2-kNN query should be, and on what basis?

(3) How to efficiently execute a 2-kNN query while preserving correctness?

(4) How to adapt well-known relational query optimization strategies (e.g., pushing selects under joins in query evaluation plans) so that they remain applicable in the context of 2-kNN queries?
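
To make challenge (1) concrete, the following minimal sketch (with hypothetical data and helper names, not code from the project) shows that pipelining two kNN-select predicates is order-sensitive, unlike ordinary relational selects:

    # A toy illustration: two kNN-selects do not commute.
    from math import dist

    def knn_select(points, focal, k):
        # Return the k points nearest to the focal point (a kNN-select).
        return sorted(points, key=lambda p: dist(p, focal))[:k]

    points = [(0, 0), (1, 0), (4, 0), (5, 0), (9, 0)]
    a, b, k = (0, 0), (9, 0), 2

    plan1 = knn_select(knn_select(points, a, k), b, k)  # kNN(a) first, then kNN(b)
    plan2 = knn_select(knn_select(points, b, k), a, k)  # kNN(b) first, then kNN(a)

    print(plan1)  # [(1, 0), (0, 0)]
    print(plan2)  # [(5, 0), (9, 0)] -- a different answer for the "same" query

Because the two evaluation orders produce different answers, an optimizer cannot freely reorder the predicates; it must first fix the intended semantics (challenge 2) and then optimize within them (challenges 3 and 4).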

 

Our research then focused on expanding the capabilities of multi-predicate location-based query servers beyond the class of 2-kNN queries along several dimensions. We explored various combinations of relational and spatial operations (journal papers: GeoInformatica 2013, VLDB Journal 2013). We studied crowd-based database indexing techniques (DBCrowd 2013, IEEE TKDE 2013) and semantic-web location-based linked-data architectures (IEEE BigData 2013).

 

In 2013-2014, we studied optimization issues for queries that involve both spatial and relational predicates. We developed a novel cost-estimation model for kNN operations executing in conjunction with relational operators. We extended our research to trajectories with limited histories (SIGSPATIAL 2014), studied the adaptivity of query execution plans in continuous streaming queries (EDBT 2014), and extended our work to "approximate" nearest-neighbor computations over high-dimensional data and proximity-based intersect operators (SISAP 2014). Our work on dependency models in which human actions are part of a database transaction appeared in IEEE TKDE 2014.

 

 

Research Activities and Publications:

Spatial Queries with Two kNN Predicates [VLDB 2012]

The widespread use of location-aware devices has led to countless location-based services in which a user query can be arbitrarily complex, i.e., one that embeds multiple spatial selection and join predicates. Amongst these predicates, the k-Nearest-Neighbor (kNN) predicate stands as one of the most important and widely used. Unlike related research, this work goes beyond the optimization of queries with a single kNN predicate and shows how queries with two kNN predicates can be optimized. In particular, our research addresses the optimization of queries with:

(i) two kNN-select predicates,

(ii) two kNN-join predicates, and

(iii) one kNN-join predicate and one kNN-select predicate.

For each query type, conceptually correct query evaluation plans (QEPs) and new algorithms that optimize the query execution time are studied. Experimental results demonstrate that the proposed algorithms outperform the conceptually correct QEPs by orders of magnitude. We conducted the first complete study of the optimization of queries with two kNN predicates, and demonstrated how traditional optimization techniques can compromise the correctness of evaluation for a query that involves two interacting kNN predicates. For the different combinations of two kNN predicates, we presented efficient algorithms that guarantee correctness of evaluation and outperform the corresponding conceptually correct QEPs by orders of magnitude. The algorithms introduced are designed for snapshot queries; applying further optimization techniques that support incremental evaluation of continuous queries with two kNN predicates is potential future work. Moreover, we believe the ideas introduced in this research pave the way towards a query optimizer that can support spatial queries with more than two kNN predicates.

 

M3: Stream Processing on Main-Memory MapReduce [ICDE 2012]

MapReduce is a popular framework for parallel computing over large-scale data on large computing clusters. However, most current implementations of the MapReduce framework support only the execution of fixed-input jobs. This restriction makes them inapplicable to most streaming applications, in which queries are continuous in nature and input data streams arrive continuously at high rates. In this research, we realize M3, a prototype implementation of the Hadoop MapReduce framework in which continuous queries over data streams can be efficiently answered. The data path in M3 is main-memory only, bypassing the Hadoop Distributed File System (HDFS) and any local disk accesses. M3 is resilient to machine failures and utilizes the machines' main memory by dynamically adapting to fluctuations in the arrival rates of the data streams. M3 operates on time pulses: a data-acquisition layer of DataTasks collects the streamed data chunks that arrive during each time period, while Map and Reduce tasks execute continuously and periodically take turns processing the collected chunks. This research highlights techniques and challenges for realizing various modes of synchronization and overlap in the execution of tasks in M3. We envision that M3 will be the underlying massively distributed streaming engine for handling the city-scale streamed spatiotemporal data that we will target next.

 

Similarity queries: their conceptual evaluation, transformations, and processing [VLDB Journal 2013]

This research forms the foundation for multi-predicate spatial queries that involve kNN predicates. Similarity queries are one possible generalization of range queries and kNN queries: the former can be viewed as a within-epsilon similarity operation, while the latter is a k-nearest-neighbors similarity. Many application scenarios can benefit significantly from the identification and processing of similarities in the data. Even though some work has been done to extend the semantics of some operators, for example join and selection, to be aware of data similarities, there has not been much study of the role and implementation of similarity-aware operations as first-class database operators. Furthermore, very little work has addressed the problem of evaluating and optimizing queries that combine several similarity operations. The focus of this research is the study of similarity queries that contain one or multiple first-class similarity database operators such as Similarity Selection, Similarity Join (SJ), and Similarity Group-by (SGB). In particular, we analyze implementation techniques for several similarity operators, introduce a consistent and comprehensive conceptual evaluation model for similarity queries, and present a rich set of transformation rules to extend cost-based query optimization to similarity queries.

Concretely, we propose and analyze several similarity database operators, and thoroughly study the evaluation and optimization of queries that combine multiple similarity operators. We introduce a model for the conceptual evaluation of similarity queries that clearly specifies how a similarity query should be evaluated even when it contains multiple similarity operations, and we present a rich set of transformation rules that turn the conceptual evaluation plan into more efficient plans. Furthermore, we demonstrate that transformation rules for similarity queries can exploit special properties of the similarity-aware operations and of the involved distance functions to enable additional useful query transformations. We also extend the important Eager/Lazy Aggregation transformation rules to the case of SGB and SJ. The experimental evaluation of the proposed rules shows they are highly effective, and we show that similarity operators can be implemented efficiently by exploiting structures and mechanisms already available in DBMSs.
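
As a concrete illustration of the two similarity-selection flavors mentioned above, the following minimal sketch (hypothetical data and names, simplified to one numeric attribute) contrasts within-epsilon selection with kNN selection:

    # Within-epsilon similarity selection: values within eps of a center.
    def sim_select_epsilon(rows, attr, center, eps):
        return [r for r in rows if abs(r[attr] - center) <= eps]

    # kNN similarity selection: the k values closest to a center.
    def sim_select_knn(rows, attr, center, k):
        return sorted(rows, key=lambda r: abs(r[attr] - center))[:k]

    rows = [{"id": i, "temp": t} for i, t in enumerate([10.0, 10.4, 11.9, 15.2, 15.3])]
    print(sim_select_epsilon(rows, "temp", 10.0, 0.5))  # ids 0 and 1
    print(sim_select_knn(rows, "temp", 15.0, 2))        # ids 3 and 4

The epsilon flavor fixes a similarity radius and returns a result of unpredictable size, while the kNN flavor fixes the result size and lets the radius vary; this difference in semantics is one reason the two operators need separate treatment during optimization.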

 

Continuous aggregate nearest neighbor queries [GeoInformatica 2013]

This research addresses the problem of supporting continuous aggregate nearest-neighbor (CANN) queries for moving objects in spatio-temporal data stream management systems. A CANN query specifies a set of landmarks, an integer k, and an aggregate distance function f (e.g., min, max, or sum) that combines the distances between a moving object and the landmarks. The answer to this continuous query is the set of k moving objects with the smallest aggregate distance f; a CANN query may also be viewed as a combined set of nearest-neighbor queries. We introduce several algorithms, including H-CANN and P-CANN, to continuously and incrementally answer CANN queries. P-CANN is a best-effort progressive algorithm that associates thresholds with the individual landmarks and uses these thresholds to eagerly prune the moving objects. Different elimination-order policies specify the order of the landmarks in the computation of the aggregate distance in P-CANN, and we address the optimization of P-CANN and how to assign its thresholds. In extensive experiments, the proposed operators outperform both H-CANN and the state-of-the-art CPM algorithm by up to a factor of 3 while incurring low memory overhead. For the optimization of P-CANN, the worst-fit elimination policy gives the least penalty for sum (an additional 14% CPU cost over optimal) when the prohibitively expensive optimal order is not used, while the best-fit elimination policy gives the least penalty for max. The optimization time of P-CANN is about 100 msec for typical CANN queries. Being best-effort, P-CANN produces about 95% of the required output size on average. As future work, we will investigate continuous aggregate nearest-neighbor queries over moving objects on road networks: on the one hand, we would like to develop similar incremental algorithms using the road-network distance instead of the Euclidean distance between objects; on the other hand, we would like to make CANN a first-class operator in a data stream management system so that it is considered while optimizing the query evaluation plan.
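
The answer semantics above can be made concrete with a minimal sketch (hypothetical data and names; the real algorithms are incremental and operate over streams, whereas this recomputes from scratch):

    # Rank moving objects by an aggregate distance to a set of landmarks.
    from math import dist

    def cann(objects, landmarks, k, agg=sum):
        # Return the k objects with the smallest aggregate landmark distance.
        return sorted(objects, key=lambda o: agg(dist(o, l) for l in landmarks))[:k]

    landmarks = [(0, 0), (10, 0)]
    objects = [(5, 3), (0, 1), (9, 9)]
    print(cann(objects, landmarks, k=2, agg=sum))  # minimize total distance
    print(cann(objects, landmarks, k=2, agg=max))  # minimize worst-case distance

A continuous version must refresh this top-k answer as the objects move, which is where the incremental H-CANN and P-CANN algorithms come in.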

 

The Palm-tree Index: Indexing with the crowd [DBCrowd 2013]

This research addresses using humans (the crowd) to perform database indexing and search operations. Crowdsourcing services allow employing human intelligence in tasks that are difficult to accomplish with computers, such as image tagging and data collection. At a relatively low monetary cost, and through web interfaces such as Amazon's Mechanical Turk (AMT), humans can act as computational operators in large systems. Recent work has built database management systems that harness crowd power in database operators such as sort, join, and count, but the fundamental problem of indexing within crowdsourced databases has not been studied. In this research, we study tree-based indexing within crowd-enabled databases. We investigate the effect of various tree and crowdsourcing parameters on the quality of index operations, propose a taxonomy of the problem and highlight its main challenges, and propose new algorithms for index construction, search, insert, and update. We intend to complete this study with an extensive analysis and experimental evaluation. Our current work focuses on one-dimensional indexing; we plan to study other variations of crowdsourced indexing, such as multidimensional, spatial, spatio-temporal, and fuzzy indexing.

 

Knowledge Cubes - A Proposal for Scalable and Semantically-Guided Management of Big Data [IEEE BigData 2013]

A Knowledge Cube, or cube for short, is an intelligent and adaptive database instance capable of storing, analyzing, and searching data. Each cube is established based on a set of semantic aspects, e.g., (1) topical, (2) contextual, (3) spatial, or (4) temporal, and specializes in handling data that is relevant to its semantic aspect. Knowledge cubes are inspired by two prime architectures: (1) Dataspaces, which provides an abstraction for data management in which heterogeneous data sources can co-exist without a unifying schema specified in advance, and (2) Linked Data, which provides a set of best practices for publishing and interlinking structured data on the web. A knowledge cube uses the best practices of Linked Data as the main building block of its data layer and encompasses some of the data-integration abstractions defined by Dataspaces. In this research, we propose knowledge cubes as a semantically-guided data management architecture, where data management is influenced by the data semantics rather than by a predefined schema. Knowledge cubes support the five pillars of Big Data, also known as the five V's: Volume, Velocity, Veracity, Variety, and Value. Many interesting opportunities can be leveraged when learning the semantics of the data; we highlight these opportunities and propose a strawman design for knowledge cubes along with the research challenges that arise when realizing them. Our research forms a vision for the knowledge cube architecture that motivates understanding the semantics of the data as a means of solving some of the research challenges we face today, specifically in Big Data. We also motivate the use of Linked Data as a means of achieving this target, given the rich semantics that Linked Data provides. We illustrate some of the challenges and potential solutions associated with the knowledge cubes proposal, and demonstrate how the proposed architectural components can be used to tackle the five pillars of Big Data.

 

JISC: Adaptive Stream Processing Using Just-In-Time State Completion [EDBT 2014]

The continuous and dynamic nature of data streams may cause the query execution plan (QEP) of a long-running continuous query to become suboptimal during execution and hence to need alteration. The ability to perform an efficient and flawless transition to an equivalent, yet optimal, QEP is essential for a data stream query processor. Such a transition is challenging for plans with stateful binary operators, such as joins, where the states of the QEP have to be maintained during query transition without compromising the correctness of the query output. In this research, we develop Just-In-Time State Completion (JISC), a new technique for query plan migration. JISC does not halt query execution and thus allows the query to maintain steady output. JISC is applicable to pipelined as well as eddy-based query evaluation frameworks. During plan transition, JISC maintains steady query output, in contrast to existing plan-adaptation techniques that can exhibit significant output latencies; steady output is essential for applications that require continuous monitoring or real-time response. JISC employs a lazy state-migration strategy that computes the missing states of the new QEP on demand, within a single running plan. In highly dynamic scenarios where the queries and streams have fluctuating selectivities and arrival rates, overlapping plan transitions are inevitable; the lazy migration strategy enables JISC to avoid performance thrashing, a critical issue in all other existing techniques. A key property of JISC is that, during plan transition, it detects the unchanged parts of the QEP and avoids recomputing their states. Our probabilistic analysis demonstrates that the number of operators with unchanged states in the new QEP is usually close to the total number of operators. For that reason, JISC outperforms existing techniques that also maintain steady query output, e.g., the Parallel Track strategy, with performance gains during plan migration of up to an order of magnitude.

 

Indexing Recent Trajectories of Moving Objects [ACM SIGSPATIAL 2014]

Advances in location-aware and object-tracking devices have led to the development of location-based services that process large amounts of spatio-temporal data. The need for efficient processing of queries on the locations of moving objects calls for trajectory-based indexing methods. These indexes need to capture both the spatial and temporal dimensions of the data in a way that minimizes the number of disk I/Os required for both updating and querying. Most existing spatio-temporal index structures capture either the current locations of the moving objects or their entire history. However, many applications require that only the recent history of a moving object's trajectory be stored. This research introduces the trails-tree, a disk-based data structure for indexing the recent history of moving objects' trajectories. The trails-tree maintains a temporal sliding window over the trajectories and uses: (1) an in-memory memo structure that reduces the I/O cost of updates via a lazy-update mechanism, and (2) lazy vacuum-cleaning mechanisms that delete the parts of the trajectories that fall out of the sliding window. Theoretical analysis and experimental evaluation illustrate that the trails-tree outperforms state-of-the-art index structures for indexing recent trajectory data by up to a factor of two.
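
The sliding-window bookkeeping described above can be sketched as follows (a minimal in-memory analogue with hypothetical names; the actual trails-tree is a disk-based index with a memo structure):

    # Keep only the recent history of each object's trajectory; lazily vacuum
    # segments that fall out of the sliding window.
    from collections import deque

    class RecentTrajectories:
        def __init__(self, window_secs):
            self.window = window_secs
            self.trails = {}  # object id -> deque of (timestamp, x, y)

        def update(self, oid, ts, x, y):
            self.trails.setdefault(oid, deque()).append((ts, x, y))

        def vacuum(self, now):
            # Lazy deletion: old segments are dropped in bulk, not on every update.
            for trail in self.trails.values():
                while trail and trail[0][0] < now - self.window:
                    trail.popleft()

Deferring deletion to an occasional vacuum pass, rather than cleaning on every update, is what keeps the amortized update cost low in the disk-based setting.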

 

The Similarity-aware Relational Intersect Database Operator [SISAP 2014] (Best Paper Award)

Identifying similarities in large datasets is an essential operation in many applications, such as bioinformatics, pattern recognition, and data integration. To make the underlying database system similarity-aware, the core relational operators have to be extended. Several similarity-aware relational operators that introduce similarity processing at the database-engine level have been proposed, e.g., similarity join and similarity group-by. In this research, we extend the semantics of the set intersection operator to operate over similar values.

We introduced the semantics and extended SQL syntax of the similarity-based set intersection operator, and developed an algorithm based on a Mark/Restore mechanism that avoids O(n^2) complexity. The proposed operator is implemented inside an open-source database system, namely PostgreSQL, and several queries from the TPC-H benchmark are extended to include similarity-based set intersection predicates. Our implementation of the proposed operator outperforms queries that produce the same result using only regular operations: the speedup ranges between 1000x and 4x for similarity threshold values ranging between 0.01% and 10% of the attribute domain range. We also demonstrated that the added functionality comes without significant overhead compared to the standard operators.
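
The intuition behind avoiding the quadratic pairwise comparison can be shown with a minimal sketch (a one-dimensional, sorted-input simplification with hypothetical names; the actual operator runs inside PostgreSQL's executor, where Mark/Restore plays the role of the forward-only cursor below):

    # Merge-style similarity intersection over sorted inputs: O(n log n) for
    # the sorts plus one coordinated scan, instead of O(n^2) pairwise checks.
    def similarity_intersect(r, s, eps):
        r, s = sorted(r), sorted(s)
        out, j = [], 0
        for a in r:
            while j < len(s) and s[j] < a - eps:  # skip s-values too small to match
                j += 1
            if j < len(s) and s[j] <= a + eps:    # nearest remaining candidate in range?
                out.append(a)
        return out

    print(similarity_intersect([1.0, 5.0, 9.0], [1.2, 4.0, 9.3], eps=0.5))  # [1.0, 9.0]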

 

HandsOn DB: Managing Data Dependencies Involving Human Actions [TKDE 2014]

Consider two values, x and y, in the database, where y = F(x). To maintain the consistency of the data, whenever x changes, F needs to be executed to re-compute y and update its value in the database. This is straightforward when F can be executed by the DBMS, e.g., an SQL or C function. In this research [TKDE 2014], we address the more challenging case where F is a human action, e.g., conducting a wet-lab experiment, taking manual measurements, or collecting instrument readings. In this case, when x changes, y remains invalid (inconsistent with the current value of x) until the human action involved in the derivation is performed and its output is reflected in the database. Many application domains, e.g., scientific applications in biology, chemistry, and physics, contain many such derivations and dependencies that involve human actions. In this research, we introduce HandsOn DB, a prototype database engine for managing dependencies that involve human actions while maintaining the consistency of the derived data. HandsOn DB includes the following features: (1) semantics and syntax for interfaces through which users can register human activities into the database and express the dependencies of data items on these activities; (2) mechanisms for invalidating and revalidating the derived data; and (3) new operator semantics that alert users when the returned query results contain potentially invalid data, and that enable evaluating queries on either valid data only, or on both valid and potentially invalid data. Performance results study the overheads associated with these features and demonstrate the feasibility and practicality of realizing HandsOn DB.
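
The invalidation/revalidation cycle can be sketched minimally as follows (hypothetical names; HandsOn DB realizes this inside the engine with SQL-level interfaces rather than application code):

    # y = F(x) where F is a human action: when x changes, y is only flagged
    # invalid; it is revalidated once the action's result is recorded.
    class Derived:
        def __init__(self, value):
            self.value, self.valid = value, True

    db = {"x": 3.0, "y": Derived(9.42)}  # y was produced by a wet-lab experiment on x

    def update_x(new_x):
        db["x"] = new_x
        db["y"].valid = False  # invalidate: the human action must be redone

    def record_human_result(new_y):
        db["y"] = Derived(new_y)  # revalidate with the action's new output

    update_x(4.0)
    print(db["y"].valid)  # False: a query touching y can now warn the user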

 

LIMO: A Web-based Environment for Learning Programming using Interactive Map Operations [Technical Report 2014]

Learning how to write computer programs is often challenging for novices with little or no coding experience. Many pedagogical programming environments motivate programming with intuitive syntax-free interfaces, interesting real-world contexts, and animated output. In this research, we introduce LIMO, a web-based programming environment centered around operations on interactive geographical maps, location-oriented data, and synthetic objects that move on the maps. LIMO materializes a low-cost, open-ended environment that integrates interactive maps and spatial data (e.g., OpenStreetMap). The unique advantage of LIMO is that it relates programming concepts to geographical maps and locations that have a basis in reality. LIMO offers an environment for learning how to program by providing (1) map and programming constructs, (2) high-quality interactive map graphics, and (3) example programs that introduce users to writing programs in the LIMO environment.

 

AQWA: Adaptive Query-Workload-Aware Partitioning of Big Spatial Data [VLDB 2016 – Full Paper (To Appear)] (paper) (AQWA code)

In support of big spatial data, this research focuses on the data layer in a cluster-based platform. The motivation for this research is the unprecedented spread of location-aware devices that has resulted in a plethora of location-based services in which huge amounts of spatial data need to be efficiently processed by large-scale computing clusters. Existing cluster-based systems for processing spatial data employ static data partitioning structures that cannot adapt to data changes, and that are insensitive to the query-workload. Hence, these systems are not able to consistently provide good performance. To close this gap, we present AQWA, an adaptive and query-workload-aware data partitioning mechanism for processing large-scale spatial data. AQWA does not assume prior knowledge of the data distribution or the query-workload. Instead, AQWA incrementally reacts to changes in both the data and the query-workload. As data is consumed and queries are processed, the data partitions are incrementally updated. With extensive experiments using real spatial data from Twitter, we demonstrate that AQWA can achieve an order of magnitude gain in query performance compared to standard spatial partitioning structures.
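
The core idea, choosing partition boundaries by workload cost rather than by data distribution alone, can be sketched in a simplified one-dimensional form (hypothetical names and cost model; AQWA itself partitions two-dimensional spatial data on a cluster):

    # Workload-aware split: accept a split only if it reduces the estimated
    # I/O of the observed query workload.
    def query_cost(partition, workload):
        lo, hi, npoints = partition
        # Each query scans every point of every partition it overlaps.
        return sum(npoints for qlo, qhi in workload if qlo < hi and qhi > lo)

    def best_split(partition, points, workload):
        lo, hi, _ = partition
        best_cost, best_mid = query_cost(partition, workload), None
        for mid in points:
            if lo < mid < hi:
                left = (lo, mid, sum(1 for p in points if lo <= p < mid))
                right = (mid, hi, sum(1 for p in points if mid <= p < hi))
                cost = query_cost(left, workload) + query_cost(right, workload)
                if cost < best_cost:
                    best_cost, best_mid = cost, mid
        return best_cost, best_mid  # best_mid is None when no split helps

Re-running this decision as the data and the query log change is what makes the partitioning adaptive; the engineering challenge AQWA addresses is doing so incrementally, without repartitioning everything.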

 

Spatial Queries with k-Nearest-Neighbor and Relational Predicates [ACM SIGSPATIAL 2015 – Full Paper] (paper) (Code)

This research is an important milestone for this project, as it identifies the feasible optimizations when k-Nearest-Neighbor (kNN, for short) predicates are intermixed with relational predicates in SQL-like query languages. The research is motivated by the ubiquity of location-aware devices and smartphones, which has unleashed an unprecedented proliferation of location-based services that require processing queries with both spatial and relational predicates. Many algorithms and index structures already exist for processing kNN predicates, either solely or combined with textual keyword search. Unfortunately, there has not been enough study of how to efficiently process queries in which kNN predicates are combined with general relational predicates, i.e., ones that have selects, joins, and group-by's. One major challenge is that, because kNN is a ranking operation, applying a relational predicate before or after a kNN predicate in a query evaluation pipeline (QEP, for short) can produce different outputs, and hence leads to different query semantics. In particular, this renders classical relational query-optimization heuristics, e.g., pushing selects below joins, inapplicable. This research introduces and studies various query-optimization heuristics for queries that involve combinations of kNN select/join predicates and relational predicates. The proposed optimizations can significantly enhance the performance of these queries while preserving their semantics. Experimental results based on queries from the TPC-H benchmark and real spatial data from OpenStreetMap demonstrate that the proposed optimizations can achieve orders-of-magnitude enhancement in query performance.
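
Why "pushing selects below kNN" changes the answer can be seen in a minimal sketch (hypothetical data and names):

    # Filtering before vs. after a kNN ranking yields different answers.
    from math import dist

    restaurants = [
        {"loc": (1, 0), "rating": 3},
        {"loc": (2, 0), "rating": 5},
        {"loc": (3, 0), "rating": 5},
    ]
    q, k = (0, 0), 2
    knn = lambda rows: sorted(rows, key=lambda r: dist(r["loc"], q))[:k]
    highly_rated = lambda rows: [r for r in rows if r["rating"] >= 5]

    print(highly_rated(knn(restaurants)))  # rank first: one restaurant, at (2, 0)
    print(knn(highly_rated(restaurants)))  # filter first: (2, 0) and (3, 0)

The first plan answers "which of the 2 nearest restaurants are highly rated?", while the second answers "which are the 2 nearest highly rated restaurants?"; both are legitimate queries, so the optimizer must preserve whichever semantics the user intended.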

 

Cost Estimation of Spatial k-Nearest-Neighbor Operators [EDBT 2015] (paper) (Code)

Advances in geo-sensing technology have led to an unprecedented spread of location-aware devices. In turn, this has resulted in a plethora of location-based services in which huge amounts of spatial data need to be efficiently consumed by spatial query processors. For a spatial query processor to choose properly among the various query-processing strategies, the cost of the spatial operators has to be estimated. In this research, we study the problem of estimating the cost of the spatial k-nearest-neighbor (k-NN, for short) operators, namely k-NN-Select and k-NN-Join. Given a query that has a k-NN operator, the objective is to estimate the number of blocks that will be scanned during the processing of this operator. Estimating the cost of a k-NN operator is challenging for several reasons. For instance, the cost of a k-NN-Select operator is directly affected by the value of k, the location of the query focal point, and the distribution of the data; a cost model that captures all these factors is relatively hard to realize. This study introduces cost-estimation techniques that maintain a compact set of catalog information that can be kept in main memory to enable fast estimation via lookups. A detailed study of the performance and accuracy trade-off of each proposed technique is presented. Experimental results using real spatial datasets from OpenStreetMap demonstrate the robustness of the proposed estimation techniques.
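
To make the estimation target concrete, here is a deliberately crude sketch under a uniform-data assumption (hypothetical names; the actual techniques use catalog lookups precisely because real data is not uniform):

    # Estimate the blocks a k-NN-Select scans: find the radius expected to
    # enclose k points, then count the blocks that radius touches.
    from math import pi, sqrt, ceil

    def knn_radius_uniform(k, n_points, area):
        # Under uniformity, a disk holding k of n points covers k/n of the area.
        return sqrt((k / n_points) * area / pi)

    def blocks_scanned(k, n_points, area, block_side):
        r = knn_radius_uniform(k, n_points, area)
        # Count the blocks overlapped by the bounding square of the search disk.
        return ceil(2 * r / block_side) ** 2

    print(blocks_scanned(k=100, n_points=1_000_000, area=10_000.0, block_side=1.0))  # 4

A catalog-based estimator replaces the uniformity assumption with precomputed per-region statistics, trading catalog size for accuracy, which is the trade-off the study examines.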

 

A Demonstration of AQWA: Adaptive Query Workload Aware Partitioning of Big Spatial Data [VLDB 2015 Demo paper] (Demo paper) (AQWA code)

During academic year 2014-2015, we realized a prototype open-source system for AQWA. AQWA is motivated by the need to efficiently organize Big Spatial Data. The ubiquity of location-aware devices, e.g., smartphones and GPS devices, has led to a variety of location-based services in which huge amounts of geo-tagged information are created every day. This prototype system demonstrates AQWA, a novel mechanism for partitioning large-scale spatial data over distributed clusters. Unlike existing cluster-based systems, e.g., SpatialHadoop, that apply static partitioning of spatial data, AQWA can react to changes in the query workload or the data distribution. A key feature of AQWA is that it does not assume prior knowledge of either; instead, AQWA adapts to changes in the query workload or data distribution in an online fashion by incrementally updating the partitioning of the data in a way that improves query execution time. We demonstrate two real prototypes of AQWA, applied to the Hadoop and Spark platforms. In both prototypes, we process spatial range and k-nearest-neighbor queries over large-scale real and synthetic datasets, and explore the performance of AQWA under different query workloads. Currently, we are making the code for AQWA on Hadoop publicly available.

 

Tornado: A Distributed SpatioTextual Stream Processing System [VLDB 2015 Demo paper] (Demo paper)

During academic year 2014-2015, we realized a prototype open-source system termed Tornado. Tornado is motivated by the need to efficiently query Big Spatial Data. Nowadays, most spatial data is also associated with text. The widespread use of location-aware devices, together with the increased popularity of micro-blogging applications (e.g., Twitter), has led to the creation of large streams of spatio-textual data. To serve real-time applications, the processing of these large-scale spatio-textual streams needs to be distributed. However, existing distributed stream-processing systems (e.g., Spark and Storm) are not optimized for spatial or textual content. In this demonstration, we introduce Tornado, a distributed in-memory spatio-textual stream-processing server that extends Storm. To efficiently process spatio-textual streams, Tornado introduces a spatio-textual indexing layer into the architecture of Storm. The indexing layer is adaptive, i.e., it dynamically redistributes the processing across the system according to changes in the data distribution and/or the query workload. In addition to keywords, higher-level textual concepts are identified and semantically matched against spatio-textual queries. Tornado also provides data de-duplication and fusion to eliminate redundant textual data. We demonstrate a prototype of Tornado running against real Twitter streams, where users can register continuous or snapshot spatio-textual queries using a map-assisted query interface.

 

Kangaroo: Workload-Aware Processing of Range Queries in Hadoop [WSDM 2016 – Full Paper] (paper)

Despite the importance and widespread use of range data, e.g., time intervals and spatial ranges, little attention has been devoted to the processing and querying of range data in the context of big data. The main challenge lies in the centralized nature of traditional index structures, e.g., the B-tree and the R-tree, which are almost crippled when deployed in a distributed environment. To address this challenge, in this study we prototype Kangaroo, a system built on top of Hadoop to optimize the execution of range queries over range data. The main idea behind Kangaroo is to split the data into non-overlapping partitions in a way that minimizes query execution time. Kangaroo is query-workload-aware, i.e., it produces partitioning layouts that minimize the query processing time of given query patterns. In this study, we expose and address the design challenges of deploying Kangaroo on top of a distributed file system, i.e., HDFS, and we study four different partitioning schemes that Kangaroo can support. With extensive experiments using real range data of more than one billion records and a real query workload of more than 30,000 queries, we show that Kangaroo's partitioning schemes can significantly reduce the I/O of range queries on range data.

 

Graph Indexing for Shortest-Path Finding over Dynamic Sub-Graphs [SIGMOD 2016 – Full Paper] (paper)

A variety of applications spanning various domains, e.g., social networks, transportation, and bioinformatics, have graphs as first-class citizens. These applications share a vital operation, namely finding the shortest path between two nodes, and in many scenarios users want to filter the graph before finding that path. For example, in social networks, one may need to compute the shortest path between two persons over a sub-graph containing only family relationships. This research focuses on dynamic graphs with labeled edges, where the target is to find a shortest path after filtering some edges based on user-specified query labels. This problem is termed the Edge-Constrained Shortest Path query (ECSP, for short). The research introduces Edge-Disjoint Partitioning (EDP, for short), a new technique for efficiently answering ECSP queries over dynamic graphs. EDP has two main components: a dynamic index based on graph partitioning, and a traversal algorithm that exploits the regular patterns in the answers of ECSP queries. EDP partitions the graph based on the labels of the edges. On demand, it computes specific sub-paths within each partition and updates its index; the computed sub-paths are cached and can be leveraged by future queries. To answer an ECSP query, EDP connects sub-paths from different partitions using its efficient traversal algorithm. EDP can dynamically handle various types of graph updates, e.g., label, edge, and node updates; the index entries potentially affected by an update are invalidated and recomputed on demand. EDP is evaluated using real graph datasets from various domains, and experimental results demonstrate query performance gains of up to four orders of magnitude over state-of-the-art techniques.
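
For reference, the naive ECSP baseline that such techniques are measured against can be stated in a few lines (hypothetical graph encoding; shown only to pin down the query semantics):

    # Baseline ECSP: drop edges whose labels are not allowed, then run Dijkstra.
    import heapq

    def ecsp_baseline(graph, src, dst, allowed):
        # graph: {node: [(neighbor, weight, label), ...]}
        pq, seen = [(0, src)], set()
        while pq:
            d, u = heapq.heappop(pq)
            if u == dst:
                return d
            if u in seen:
                continue
            seen.add(u)
            for v, w, label in graph.get(u, []):
                if label in allowed and v not in seen:
                    heapq.heappush(pq, (d + w, v))
        return None  # no path under the label constraint

    g = {"a": [("b", 1, "family"), ("c", 1, "friend")], "b": [("c", 1, "family")]}
    print(ecsp_baseline(g, "a", "c", {"family"}))  # 2: the friend edge is filtered out

Because the allowed-label set changes from query to query, no single precomputed shortest-path index applies to all queries; EDP's label-based partitions and cached sub-paths address exactly this.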

 

Cruncher: Distributed In-Memory Processing for Location-Based Services [IEEE ICDE 2016] (Demo paper)

Advances in location-based services (LBS) demand high-throughput processing of both static and streaming data. Recently, many systems have been introduced to support distributed main-memory processing in order to maximize query throughput; however, these systems are not optimized for spatial data processing. In this demonstration, we showcase Cruncher, a distributed main-memory spatial data warehouse and streaming system. Cruncher extends Spark with adaptive query-processing techniques for spatial data. Cruncher uses dynamic batch processing to distribute the queries and the data streams over commodity hardware according to an adaptive partitioning scheme. The batching technique also groups and orders the overlapping spatial queries to enable inter-query optimization. Both the data streams and the offline data share the same partitioning strategy, which allows for data co-locality optimization. Furthermore, Cruncher uses an adaptive caching strategy to keep frequently-used location data in main memory. Cruncher maintains operational statistics to optimize query processing, data partitioning, and caching at runtime. We demonstrate two LBS applications over Cruncher using real datasets from OpenStreetMap and two synthetic data streams, and we demonstrate that Cruncher achieves order(s)-of-magnitude throughput improvement over Spark when processing spatial data.

 

Efficient Processing of Hamming-Distance-Based Similarity Search Queries Over MapReduce [EDBT 2015] (paper)

Similarity and proximity searches are crucial to many applications. Of particular interest are two flavors of the Hamming-distance range query, namely the Hamming-select and the Hamming-join. Hamming distance is widely used in approximate nearest-neighbor search for high-dimensional data, such as images and document collections. For example, using predefined similarity hash functions, high-dimensional data is mapped into one-dimensional binary codes that are then linearly scanned to perform Hamming-distance comparisons. These distance comparisons on the binary codes are usually costly and often involve excessive redundancies. In this study, we introduce a new index, termed the HA-index, that speeds up distance comparisons and eliminates redundancies when performing the two flavors of Hamming-distance range queries. An efficient search algorithm based on the HA-index is presented. A distributed version of the HA-index is introduced, and algorithms for realizing Hamming-select and Hamming-join operations on a MapReduce platform are prototyped. Extensive experiments using real datasets demonstrate that the HA-index and the corresponding search algorithms achieve up to two orders of magnitude speedup over existing state-of-the-art approaches, while saving more than ten times in memory space.
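
The two query flavors have simple definitions, shown below in naive scan form (hypothetical data; this linear scan with per-pair popcounts is precisely the costly baseline the HA-index is designed to beat):

    # Hamming-select and Hamming-join over one-dimensional binary codes.
    def hamming(a, b):
        return bin(a ^ b).count("1")

    def hamming_select(codes, query, radius):
        return [c for c in codes if hamming(c, query) <= radius]

    def hamming_join(r_codes, s_codes, radius):
        return [(a, b) for a in r_codes for b in s_codes if hamming(a, b) <= radius]

    codes = [0b0000, 0b0011, 0b1111]
    print(hamming_select(codes, 0b0001, radius=1))  # [0, 3]: 0b0000 and 0b0011
    print(hamming_join(codes, [0b0111], radius=1))  # [(3, 7), (15, 7)]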

 

Geo-tagging Non-Spatial Concepts [ACM SIGSPATIAL Mobile GIS workshop 2015 - To Appear] (paper)

This research addresses a new and interesting type of query, namely geo-tagging non-spatial concepts. For example, consider the following queries: show on the map potential crime locations in Chicago, or show on the map potential pollution regions in San Francisco. Because "crime" and "pollution" are non-spatial concepts, it is hard to pinpoint a location on the map at which to place them. In general, concept geo-tagging is the process of assigning a textual identifier that describes a real-world entity to a physical geographic location. A concept can either be a spatial concept, with a spatial presence, or a non-spatial concept, with no explicit spatial presence. Geo-tagging locations with non-spatial concepts that have no direct relation to them is a very useful and important operation, but it is also very challenging precisely because a non-spatial concept, e.g., crime, has no explicit location. In this study, we propose to use the semantic information associated with concepts and locations, such as their types, as a means of identifying these relations. The co-occurrence of spatial and non-spatial concepts within the same textual resources, e.g., on the web, can be an indicator of a relationship between them. Techniques are presented for learning and modeling relations among spatial and non-spatial concepts from web textual resources. Co-occurring concepts are extracted and modeled as a graph of relations, and this graph is used to infer the location types related to a concept. A location type can be a hospital, a restaurant, an educational facility, and so forth. Because of the immense number of relations generated by the extraction process, a semantically-guided query-processing algorithm is introduced to prune the graph to the most relevant set of related concepts. For each concept, the most relevant types are matched against the location types. Experiments evaluate the proposed algorithm on its filtering efficiency and the relevance of the discovered relationships. Performance results illustrate how semantically-guided query processing outperforms the baseline in both efficiency and relevance, and the proposed approach achieves an average precision of 74% across three different datasets.

 

LIMO: Learning Programming using Interactive Map Activities [ACM SIGSPATIAL 2015 Demo Paper] (Demo paper)

Advances in geographic information and interactive two- and three-dimensional map visualization, accompanied by the proliferation of mobile devices and location data, have tremendously benefited the development of geo-educational applications. We demonstrate LIMO, a web-based programming environment centered around operations on interactive geographical maps, location-oriented data, and synthetic objects that move on the maps. LIMO materializes a low-cost, open-ended environment that integrates interactive maps and spatial data (e.g., OpenStreetMap). The unique advantage of LIMO is that it relates programming concepts to interactive geographical maps and location data. LIMO offers an environment for students to learn how to program by providing (1) an easy-to-program library of map and spatial operations, (2) high-quality interactive map graphics, and (3) example programs that introduce users to writing programs in the LIMO environment.

 

On Map-Centric Programming Environments [ACM SIGSPATIAL 2015 Vision Paper] (Vision paper)

2D maps and 3D globes can be used as programming toys to help students learn programming, in contrast to the robots or visual and multimedia components used in introductory (CS-I) programming courses. This study exposes the research challenges of supporting this concept and presents one instance of a 2D and 3D map-based programming environment to motivate these challenges.

 

Similarity Group-by Operators for Multi-dimensional Relational Data [IEEE TKDE] (paper)

The SQL group-by operator plays an important role in summarizing and aggregating large datasets in a data-analytics stack. While the standard group-by operator, which is based on equality, is useful in many applications, proximity-aware grouping provides a more realistic view of real-world data that can lead to better insights. The Similarity SQL-based Group-By operator (SGB, for short) extends the semantics of the standard SQL group-by by grouping data with similar, but not necessarily equal, values. While existing similarity-based grouping operators efficiently realize these approximate semantics, they primarily focus on one-dimensional attributes and treat the dimensions of multi-dimensional attributes independently. Consequently, correlated attributes, such as those in spatial data, are processed independently, and groups in the multi-dimensional space are not detected properly. To address this problem, we introduce two new SGB operators for multi-dimensional data. The first is the clique (or distance-to-all) SGB, where all the tuples in a group are within some distance of each other. The second is the distance-to-any SGB, where a tuple belongs to a group if it is within some distance of any other tuple in the group. Since a tuple may satisfy the membership criterion of multiple groups, we introduce three semantics for such cases: (i) eliminate the tuple, (ii) put the tuple in exactly one group, or (iii) create a new group for the tuple. We implement and test the new SGB operators and their algorithms inside PostgreSQL. The overhead introduced by these operators proves to be minimal, and their execution times are comparable to those of the standard group-by. The experimental study, based on TPC-H and social check-in data, demonstrates that the proposed algorithms achieve up to three orders of magnitude enhancement in performance over baseline methods developed to solve the same problem.
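
The difference between the two membership rules can be illustrated with a minimal sketch (hypothetical names; shown for points in the plane, using union-find for the distance-to-any rule):

    # Distance-to-any SGB: a point joins a group if it is within eps of ANY
    # member, so groups grow transitively (single-linkage style).
    from math import dist

    def sgb_distance_to_any(points, eps):
        parent = list(range(len(points)))
        def find(i):
            while parent[i] != i:
                parent[i] = parent[parent[i]]  # path compression
                i = parent[i]
            return i
        for i in range(len(points)):
            for j in range(i + 1, len(points)):
                if dist(points[i], points[j]) <= eps:
                    parent[find(i)] = find(j)  # merge the two groups
        groups = {}
        for i in range(len(points)):
            groups.setdefault(find(i), []).append(points[i])
        return list(groups.values())

    pts = [(0, 0), (1, 0), (2, 0), (9, 9)]
    print(sgb_distance_to_any(pts, eps=1.0))  # [[(0,0), (1,0), (2,0)], [(9,9)]]

Under the clique (distance-to-all) rule with the same eps, the first group would have to split, since (0, 0) and (2, 0) are 2.0 apart; this is exactly the semantic gap between the two operators.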

 

The Similarity-aware Relational Database Set Operators [Information Systems Journal, 2015] (paper)

Finding data items in the proximity of a query item can be formulated as a similarity operation. Identifying such similarities in large datasets is an essential operation in several applications, such as bioinformatics, pattern recognition, and data integration. To make a relational database management system similarity-aware, the core relational operators have to be extended. While similarity-awareness has been introduced into database engines for relational operators such as join and group-by, little has been achieved for the relational set operators, namely Intersection, Difference, and Union. In this paper, we propose extending the semantics of the relational set operators to take into account the similarity of values. We develop efficient query-processing algorithms for evaluating the new operators and implement them inside an open-source database system, namely PostgreSQL. By extending several queries from the TPC-H benchmark to include predicates that involve similarity-based set operators, we perform extensive experiments that demonstrate up to three orders of magnitude speedup in performance over equivalent queries that employ only regular operators.

 

ORLF: A Flexible Framework for Online Record Linkage and Fusion [IEEE ICDE 2016] (Demo paper)

With the exponential growth of data on the Web comes the opportunity to integrate multiple sources to give more accurate answers to user queries. Upon retrieving records from multiple Web databases, a key task is to merge records that refer to the same real-world entity. We demonstrate ORLF (Online Record Linkage and Fusion), a flexible query-time record linkage and fusion framework. ORLF de-duplicates newly arriving query results jointly with previously processed query results. We use an iterative caching solution that leverages query locality to effectively de-duplicate newly incoming records with cached records. ORLF aims to deliver timely query answers that are duplicate-free and reflect knowledge collected from previous queries.

 

Approving Updates in Collaborative Databases [IEEE IC2E 2015] (paper)

Although this research was motivated by, and started in, the context of cleaning dirty spatial data, the techniques developed proved to be generally applicable to many application domains, including scientific data curation. Data curation activities, especially in collaborative databases, mandate that collaborators interact until they converge and agree on the content of their data. Typically, updates by a member of the collaboration are made visible to all collaborators for comment, while remaining pending approval or rejection by the data custodian, e.g., the principal scientist or investigator (PI). In current database technologies, approval and authorization of updates are based solely on the identity of the user, e.g., via the SQL GRANT and REVOKE commands. However, in collaborative environments, the updated data is open to collaborators for discussion and further editing, and is finally approved or rejected by the PI based on the content of the data, not the identity of the updater. In this research, we introduce a cloud-based collaborative database system that promotes and enables collaboration and data-curation scenarios. We realize content-based update approval and history tracking of updates inside HBase, a distributed and scalable open-source cluster-based database. We investigate the design and implementation of several approaches for update approval, present a detailed performance study, and contrast alternative techniques.

 

Precision-Bounded Access Control Using Sliding-Window Query Views for Privacy-Preserving Data Streams [TKDE 2015] (paper)

This research extends spatial indexing and spatial query-processing techniques to the context of access control and privacy preservation over data streams. Access-control mechanisms and Privacy Protection Mechanisms (PPMs) have been proposed for data streams. Access control for a data stream grants roles access to tuples satisfying an authorized predicate sliding-window query. Sharing the sensitive stream data without a PPM can compromise privacy. The PPM meets privacy requirements, e.g., k-anonymity or l-diversity, by generalizing the stream data. The imprecision introduced by generalization can be reduced by delaying the publishing of stream data; however, delaying stream tuples for better accuracy can lead to false negatives if the tuples are still held by the PPM while a query predicate is evaluated. The administrator of an access-control policy defines an imprecision bound for each query. The challenge for the PPM is to optimize the delay in publishing stream data so that the imprecision bound is satisfied for the maximum number of queries. We formulate the precision-bounded access control for privacy-preserving data streams problem, present hardness results, provide an anonymization algorithm, and conduct an experimental evaluation of the proposed algorithm. Experiments demonstrate that the proposed heuristic provides better precision for a given data-stream access-control policy than the minimum- or maximum-delay heuristics proposed in the existing literature.

 

 

Teaching, Education, Training, and Development

2011-2012

Education and Course Design:

In Fall 2011, Aref offered a graduate-level seminar class, CS698. The purpose of this course was to train students in spatiotemporal data management research. Students learned basic and advanced techniques in spatial and spatiotemporal data management through several projects. The main class project was to design an introductory-level (CS-I) programming course based on spatiotemporal data management techniques, e.g., using 2D and 3D map and moving-object operations; more detail on the CS Programming-I course is given below. In the class, students covered some of the fundamental papers in spatial and spatiotemporal data management, as well as the tools that facilitate spatial and spatiotemporal data systems research, e.g., data generators, benchmarks, open-source systems, and extensible indexing architectures. This course counts as one of the two CS698 research courses a Ph.D. student can take in his or her first three semesters, or as a CS590 independent-study course. The class met once a week, on Wednesdays, and each student was expected to give two to three presentations over the span of the semester. In addition to the CS Programming-I course project, in which every student was expected to participate, each student, or a group of one to three students, selected a semester-long project. Each student (or group) was expected to meet with Walid individually once a week to follow up on the project's progress. During class, group discussions revolved around the CS Programming-I project following the students' presentations.

 

CS Programming-I Project:

This part of the class involved extensive brainstorming and design activities. The purpose of this course project was to design an introductory programming course in computer science to address the low retention of freshman computer science students and their diminished interest in science. The target is to go beyond the classical 'Hello World' programming examples, which have shown their limits. The goal of this project is to design the CS Programming-I course around 2D and 3D map operations (e.g., using 3D Earth and 2D map APIs) to increase students' interest in programming, both in CS and in science. According to CRA reports, interest among undergraduate students in majoring in computer science has decreased significantly, and universities nationwide have experienced a noticeable decline in freshman registration in CS in recent years. For example, the number of new CS majors in Fall 2007 was half of what it was in Fall 2000 (7,915 versus 15,958). Several colleges attribute this decline to the increase in computer literacy among incoming students and the boring nature of the freshman Programming-I courses: a first program that prints 'Hello World!' on the screen is no longer thrilling to students who have played computer games with high-quality graphics since kindergarten. To add excitement, several colleges have redesigned their freshman Programming-I courses to use toy devices, e.g., robots, where students program the robot to perform certain tasks while learning various programming concepts in the process. Although interesting to some students, using robots has several disadvantages. The high setup cost of obtaining and maintaining the robots is one setback; another is the frustration many students experience when dealing with hardware and software debugging issues simultaneously. The goal of this project is to design a CS Programming-I course that uses 2D and 3D maps (e.g., Google Earth and Google Maps) as the 'toy' through which freshman CS students learn programming concepts. Besides the low setup cost, learning with 2D and 3D maps adds the needed excitement by introducing high-quality graphics and high interactivity, and by relating programming tasks to maps or photos of locations the students can relate to. Wrapper APIs need to be developed to simplify the setup and interaction with the map software. The new CS Programming-I course is to be developed along the same lines as Purdue's existing first programming course (CS-180).

 

Education and Course Design Progress:

Eleven graduate students (8 males and 3 females) attended the CS698 class that Aref offered in Fall 2011. Topics covered in class included:

- Dissection of Purdue's existing CS-177 and CS-180 introductory CS programming courses and their exercises

- Study of 2D and 3D map APIs (e.g., Google's and Microsoft's products, among others)

- Study of spatial and spatiotemporal data operations

- What are the basic, minimal, and complete sets of spatiotemporal operations?

- Study of map and GIS (Geographic Information Systems) operations

- Classic multi-dimensional (spatial) and spatiotemporal data indexing techniques

- Spatial and spatiotemporal query processing algorithms

- Spatial and spatiotemporal query optimization

- Spatial and spatiotemporal data management systems

- Spatiotemporal data streaming systems

- Study of publicly available spatial and spatiotemporal data sets

- Synthetic spatiotemporal data generators

- Benchmarking spatial and spatiotemporal data systems

 

Student projects in the course included: spatiotemporal query optimization, a study of publicly available spatial and spatiotemporal data sets (real and synthetic), parallel spatiotemporal data indexing, distance oracles, map matching, and a study of spatiotemporal data generators. Several 2D- and 3D-based programming project ideas and programming primitives were developed for the CS Programming-I course. These ideas need further elaboration and are currently being studied by Walid and his group.

 

Training and Development:

Students have gained research experience in the context of this project and have published their results in rigorous conference outlets, e.g., VLDB, one of the two most prestigious and competitive publication venues in the field of database systems (along with the ACM SIGMOD Conference). Mr. Aly got his paper accepted into VLDB 2012, an excellent experience for him as the first publication of his career. During the graduate seminar course (CS698) that Aref offered in Fall 2011, the students (8 males and 3 females) benefitted tremendously: through the class activities, they gave many presentations about fundamental ideas and papers in the field of spatial database systems and covered progress on their class projects. Students also learned how to critique the ideas of others in a balanced fashion, whether in published work or in their colleagues' class projects. Through this class experience, several students got started on their Ph.D. research, including Mr. Mahmood and Mr. Tang. Students have also gained tremendous experience working with large open-source software systems, e.g., Hadoop. Our M3 project exposed them to invaluable software-development experience while adapting Hadoop, eliminating all of its disk layers and turning it into a massively distributed and parallel data streaming system. Mr. Aly was later invited to spend the summer at Microsoft Research, where he sharpened his research skills further.

 

2012-2013

Education and Course Design

Aref offered over 15 graduate research independent study courses (CS590, CS698, CS699) in Fall 2012 and Spring 2013. The purpose of these courses is to train graduate students, individually or in small groups, in various topics in spatiotemporal data management research. Students learn advanced topics in spatial and spatiotemporal data management through several interesting independent study or group projects. Aref currently has 11 Ph.D. students (10 in CS, 1 in ECE), three of whom were supported by this grant; one additional woman Ph.D. student (Ruby Tahboub) will be supported by this grant as of January 2014.

One of the targets of this project's education plan is to design an introductory programming course in computer science that addresses the low retention of computer science freshmen and their diminished interest in science. The target is to go beyond the classical 'Hello World' programming examples, which are no longer thrilling to students who have been playing computer games with high-quality graphics since kindergarten. Our goal is to design a CS Programming-I course that uses 2D and 3D maps (e.g., Google Earth and Google Maps) as the 'toy' through which freshman CS students learn programming concepts, in contrast to the robots used by other programming environments. Aref and one Ph.D. student have been working on developing this introductory-level (CS-I) programming course based on spatiotemporal data management techniques, e.g., using 2D and 3D map and moving-object operations. We have focused on studying several existing introductory programming environments, e.g., Scratch and Alice, and have started developing 2D map-based programming primitives and abstract operations that serve as building blocks for the map-based programming language to be developed. Currently, we are using these primitives to develop simple programming exercises that serve as a way to debug the primitives. Once the design of these map primitives and programming abstractions converges and is finalized, we will start implementing them for testing.

 

Training and Development

Students have gained research experience in the context of this project. They have published their results in rigorous conference and journal outlets, e.g., the VLDB Journal, the IEEE Transactions on Knowledge and Data Engineering, the GeoInformatica Journal, the IEEE BigData Conference, and the VLDB DBCrowd workshop. Many of the participating students gained excellent experience, as these were the first publications of their careers. During the graduate independent study courses, the Ph.D. students (10 males and 1 female) benefitted from the various class activities, and many of them got "jumpstarted" into spatiotemporal data systems research through systems-oriented projects that resulted in conference and journal paper submissions.

Several students, e.g., Mr. Madkour and Mr. Mahmood (both supported under this project in the 2012/2013 academic year), got their first research papers accepted at IEEE BigData 2013 and the VLDB DBCrowd 2013 workshop, respectively. Students have also gained experience working with large open-source software systems, e.g., Hadoop and PostgreSQL. Because of this experience, four of the Ph.D. students were invited for summer internships at various industrial and research labs.

Post-doctoral researcher Dr. Shen Zhihong from the Chinese Academy of Sciences visited Purdue, at his government's expense, to collaborate with Aref’s research group and receive training in the context of this project. Also, Dr. Saleh Basalamah, Director of the GIS Technology Innovation Center, Umm Al-Qura University, Saudi Arabia, spent an academic year at Purdue to collaborate in the context of this project. Dr. Basalamah is a co-author of the DBCrowd 2013 and IEEE BigData 2013 conference papers.

Dissemination of Results to Communities of Interest and Outreach Activities:

In 2012/2013, Aref offered the over 15 independent graduate research courses mentioned above, which introduced the project's topics to 11 Ph.D. students during the fall and spring semesters. Walid served as an organizing committee member of the Spatial Computing 2020 Workshop sponsored by NSF/CCC to promote a unified agenda for spatial computing research (http://cra.org/ccc/visioning/visioning-activities/spatial-computing/196-spatial-computing-workshop), where he led the Systems track. This resulted in an article, co-authored by Walid, that is currently being submitted to CACM. In December 2012, Walid gave a keynote speech at the International Conference on Connected Vehicles and Expo (Beijing, China) reflecting advances in spatiotemporal database systems research. Walid continues to chair ACM SIGSPATIAL, the ACM special interest group on spatial algorithms and systems (2011-2014), of which he was one of the four founding members.

2013-2014

Education and Course Design

Aref offered over 20 graduate and undergraduate research independent study and thesis courses (CS490, CS590, CS698, CS699) in Fall 2013, and Spring and Summer 2014. The purpose of these courses is to train students, individually or in small groups, in various topics in spatiotemporal data management research. Students learn advanced topics in spatial and spatiotemporal data management through several interesting independent study or group projects, including distributed and parallel spatiotemporal data streaming, benchmarking of spatiotemporal databases, and declustered spatiotemporal query processing, among many other topics. These studies are expected to result in conference papers in the coming academic year. Aref currently has one Master's student and 12 Ph.D. students (11 in CS, 1 in ECE), three of whom were supported by this grant, including one woman Ph.D. student (Ruby Tahboub). Another woman Ph.D. student is scheduled to join this project in Spring 2015. Senior undergraduate student Linda Thongsavath did her senior design project on the topic of benchmarking spatiotemporal databases with deep query evaluation pipelines.

 

LIMO: A Web-based Environment for Learning Programming using Interactive Map Operations [Technical Report 2014]

The computer science education community has invested tremendous resources in raising interest in computing and improving retention. A substantial share of these efforts relies on developing innovative programming environments that target young age groups. Along this line, we introduce LIMO, a web-based environment for learning programming using activities related to interactive two-dimensional geographical maps and the operations of moving objects on these maps. An essential aspect of LIMO is that it provides diverse programming constructs that enable users to process, customize, and visualize location data on the map. In our view, the integration of interactive maps, location-based data, and seamless spatial constructs within an educational programming environment is a very promising direction. We plan to develop LIMO further with additional spatial and visual constructs to make it more attractive to novice programmers. We plan to conduct a usability study that involves novice users to assess the efficacy of using LIMO while learning programming. Finally, we plan to develop a curriculum for an introductory computer science course based on LIMO.

Aref and two Ph.D. students have continued to work on developing LIMO based on spatiotemporal data management techniques using 2D and 3D map and moving-object operations. In 2013/2014, we developed 2D and 3D map-based programming primitives and abstract operations around Google Maps and Google Earth. These 2D and 3D map primitives serve as building blocks for the map-based programming language that we are currently developing, and we are using them to develop simple programming exercises that serve as a way to debug the primitives. To enrich this map-based programming environment, we integrated an open-source map database (namely, OpenStreetMap) underneath the building blocks, so that the building blocks can refer to the underlying spatial objects as well as their textual descriptions (e.g., rivers, lakes, shopping centers). The programming exercises that we developed gave rise to interesting new research problems that Ph.D. student Ruby Tahboub is currently studying. A hypothetical sketch of the style of these primitives appears below.
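To give a flavor of these building blocks, here is a short hypothetical Python sketch. The limo module and every name in it (Map, MovingObject, find_features, etc.) are invented for illustration and do not represent LIMO's actual API.

    # A hypothetical illustration of map-based programming primitives of
    # the kind described above; "limo" and all names in it are invented.
    from limo import Map, MovingObject, find_features

    # A 2D map backed by an open-source map database, so that primitives
    # can refer to spatial objects and their textual descriptions.
    city = Map(provider="OpenStreetMap", center=(40.4237, -86.9212), zoom=14)

    # Look up named spatial objects near the map center, e.g., rivers,
    # and highlight them on the map.
    rivers = find_features(near=city.center, kind="river", radius_km=5)
    for river in rivers:
        city.highlight(river)

    # Animate a moving object and attach a simple spatial-event handler,
    # giving students a first taste of moving-object operations.
    bus = MovingObject(path=[(40.4237, -86.9212), (40.4301, -86.9100)],
                       speed_kmh=30)
    bus.on_enter(rivers[0], lambda: city.popup("Crossing the river!"))
    city.add(bus)
    city.play()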

 

Publications

 

1.     A.M. Aly, W.G. Aref, M. Ouzzani: Spatial Queries with Two kNN Predicates. Proceedings of the VLDB Endowment (VLDB 2012), vol. 5, pp. 1100-1111, Istanbul, Turkey (2012).

 

2.     A.M. Aly, A. Sallam, B.M. Gnanasekaran, L.-V. Nguyen-Dinh, W.G. Aref, M. Ouzzani, and A. Ghafoor, "M3: Stream Processing on Main-Memory MapReduce", Proceedings of the 28th International Conference on Data Engineering (ICDE), Washington DC, (2012).

 

3.     Y.N. Silva, W.G. Aref, P. Larson, S. Pearson, M.H. Ali: Similarity queries: their conceptual evaluation, transformations, and processing. VLDB J. 22(3): 395-420 (2013).

 

4.     H.G. Elmongui, M.F. Mokbel, W.G. Aref: Continuous aggregate nearest neighbor queries. GeoInformatica 17(1): 63-95 (2013).

 

5.     A.R. Mahmood, W.G. Aref, S.M. Basalamah, E. Dragut. The Palm-tree Index: Indexing with the crowd. The VLDB DBCrowd Workshop, 2013.

 

6.     A. Madkour, W.G. Aref, S.M. Basalamah. Knowledge Cubes - A Proposal for Scalable and Semantically-Guided Management of Big Data. IEEE BigData Conference, 2013.

 

7.     A.R. Mahmood, A.M. Aly, W.G. Aref, S.M. Basalamah. Indexing Recent Trajectories of Moving Objects. ACM SIGSPATIAL GIS, 2014.

 

8.     R.Y. Tahboub, J. Shin, W.G. Aref, S. Prabhakar: LIMO: A Web-based Environment for Learning Programming using Interactive Map Operations. Purdue Computer Science Technical Report, 2014. Submitted for conference publication.

 

9.     Z. Pervaiz, W.G. Aref, A. Ghafoor, N. Prabhu: Accuracy-Constrained Privacy-Preserving Access Control Mechanism for Relational Data. IEEE Trans. Knowl. Data Eng. 26(4): 795-807 (2014).

 

10.  M.Y. Eltabakh, W.G. Aref, A.K. Elmagarmid, M. Ouzzani: HandsOn DB: Managing Data Dependencies Involving Human Actions. IEEE Trans. Knowl. Data Eng. 26(9): 2193-2206 (2014).

 

11.  A.M. Aly, W.G. Aref, M. Ouzzani, H.M. Mahmoud: JISC: Adaptive Stream Processing Using Just-In-Time State Completion. EDBT 2014: 73-84.

 

12.  W.J. Al Marri, Q.M. Malluhi, M. Ouzzani, M. Tang, W.G. Aref: The Similarity-Aware Relational Intersect Database Operator. SISAP 2014: 164-175. (Best paper award and invited for special issue journal publication).

 

13.  A.M. Aly, W.G. Aref, M. Ouzzani: Cost Estimation of Spatial k-Nearest-Neighbor Operators. EDBT 2015.

 

14.  A.M. Aly, A.S. Abdelhamid, A.R. Mahmood, W.G. Aref, M.S. Hassan, H. Elmeleegy, M. Ouzzani (2015). A Demonstration of AQWA: Adaptive Query-Workload-Aware Partitioning of Big Spatial Data. Proceedings of the VLDB Endowment (VLDB), demo paper.

 

15.  K. Mershad, Q.M. Malluhi, M. Ouzzani, M. Tang, W.G. Aref (2015). Approving Updates in Collaborative Databases. IEEE International Conference on Cloud Engineering.

 

16.  A. Madkour, W.G. Aref, M. Mokbel, S. Basalamah (2015). Geo-tagging Non-Spatial Concepts. ACM SIGSPATIAL MobiGIS Workshop.

 

17.  A.M. Aly, H. Elmeleegy, Y. Qi, W.G. Aref (2016). Kangaroo: Workload-Aware Processing of Range Data and Range Queries in Hadoop. 9th ACM International Conference on Web Search and Data Mining (WSDM). Status = ACCEPTED.

 

18.  R.Y. Tahboub, J. Shin, A. Abdelsalam, J.W. Aref, W.G. Aref, S. Prabhakar (2015). LIMO: Learning Programming using Interactive Map Activities (Demo Paper). ACM SIGSPATIAL. Status = ACCEPTED.

 

19.  M. Tang, Y. Yu, W.G. Aref, Q.M. Malluhi, M. Ouzzani (2015). Efficient Processing of Hamming-Distance-Based Similarity-Search Queries Over MapReduce. EDBT 2015: 361-372.

 

20.  W.G. Aref, S. Prabhakar, J. Shin, R.Y. Tahboub, A. Abdelsalam, J.W. Aref (2015). On Map-Centric Programming Environments (Vision Paper). ACM SIGSPATIAL.  Status = ACCEPTED.

 

21.  M. Tang, R.Y. Tahboub, W.G. Aref, M.J. Atallah, M. Gribskov, Q.M. Malluhi, M. Ouzzani, Y.N. Silva (2015). Similarity Group-by Operators for Multi-dimensional Relational Data. IEEE Transactions on Knowledge and Data Engineering. Status = ACCEPTED.

 

22.  A.M. Aly, W.G. Aref, M. Ouzzani (2015). Spatial Queries with k-Nearest-Neighbor and Relational Predicates. ACM SIGSPATIAL. Status = ACCEPTED.

 

23.  A.R. Mahmood, A.M. Aly, T. Qadah, A. Madkour, A.S. Abdelhamid, M.S. Hassan, W.G. Aref, S. Basalamah (2015). Tornado: A Distributed Spatio-Textual Stream Processing System. VLDB, Proceedings of the VLDB. Status = PUBLISHED.

 

24.  W.J. Al Marri, Q.M. Malluhi, M. Ouzzani, M. Tang, W.G. Aref (2015). The Similarity-Aware Relational Database Set Operators. Information Systems Journal. Status = ACCEPTED.

 

25.  Z. Pervaiz, A. Ghafoor, W.G. Aref (2015). Precision-Bounded Access Control Using Sliding-Window Query Views for Privacy-Preserving Data Streams. IEEE Trans. Knowl. Data Eng. 27(7): 1992-2004.

 

26.  M.S. Hassan, A.M. Aly, W.G. Aref, Graph Indexing for Shortest-Path Finding over Dynamic Sub-Graphs, ACM SIGMOD 2016 (Full Paper).

 

27.  A.M. Aly, M.S. Hassan, A.R. Mahmood, W.G. Aref, H. Elmeleegy, M. Ouzzani, AQWA: Adaptive Query-Workload-Aware Partitioning of Big Spatial Data, VLDB 2016 (Full Paper).

 

28.  M. Tang, R.Y. Tahboub, W.G. Aref, M.J. Atallah, Q.M. Malluhi, M. Ouzzani, Y.N. Silva: Similarity Group-by Operators for Multi-Dimensional Relational Data. IEEE Trans. Knowl. Data Eng. 28(2): 510-523 (2016).

 

29.  S. Shekhar, S.K. Feiner, W.G. Aref: Spatial Computing. Communications of the ACM 59(1): 72-81 (2016).

 

30.  A.S. Abdelhamid, M. Tang, A.M. Aly, A.R. Mahmood, T. Qadah, W.G. Aref, S. Basalamah: Cruncher: Distributed In-Memory Processing for Location-Based Services. IEEE ICDE 2016, demo paper.

 

31.  E.K. Rezig, E.C. Dragut, M. Ouzzani, A.K. Elmagarmid, W.G. Aref: ORLF: A Flexible Framework for Online Record Linkage and Fusion. IEEE ICDE 2016, demo paper.

 

Collaborators:

·       Dr. Paul Larson: Microsoft Research, Redmond, WA collaborated in writing a research paper [VLDBJ2013] that provides foundational research for the correctness ideas in this grant.

 

·       Dr. M.H. Ali: Microsoft Corporation, Redmond, Washington, collaborated in writing a research paper [VLDBJ2013] that provides foundational research for the correctness ideas in this grant.

 

·       Dr. Hicham Elmongui: Amazon, collaborated in writing a research paper [GeoInformatica2013] that presents algorithms for efficiently evaluating aggregate nearest-neighbor queries.

 

·       Prof. M. Eltabakh: WPI, Massachusetts, collaborated in writing a research paper [IEEE TKDE 2014] that presents models and techniques for integrating human activities into database systems.

 

·       Graduate Students: A. Aly (5th year Ph.D. student), M. Tang (4th year Ph.D. student), A. Mahmood (4th year Ph.D. student), R. Tahboub (4th year Ph.D. student), A. Madkour (4th year Ph.D. student), and M. Hassan (2nd year Ph.D. student) were funded at different periods under this grant and worked on various aspects of this project.

 

·       S. Pearson: Graduate student at Arizona State who collaborated in the context of generalizing the results of this project to similarity-based databases. Mr. Pearson conducted the experiments requested by the reviewers in order to revise the submitted paper, which was later accepted to appear in the VLDB Journal [VLDBJ2013].

 

·       B. Coffey: Graduate student at Purdue University who collaborated in the context of collecting meta-data about publicly available spatial data sets.

 

·       Undergraduate Students: Linda Thongsavath: Undergraduate student at Purdue University who collaborated on realizing a benchmark, for spatiotemporal databases, of multi-predicate queries that include relational, spatial, and kNN predicates.

 

·       Visitors and Post-docs:

 

o   Dr. Shen Zhihong: Chinese Academy of Sciences, Beijing, China (August 2013- October 2013) participated in designing cluster-based user workspaces.

 

o   Dr. Saleh Basalamah: Director of the GIS Technology Innovation Center, Umm Al-Qura University, Saudi Arabia (April 2013-Present), participated in coauthoring multiple research papers, including [DBCrowd2013], [IEEE BigData 2013], and [ACM SIGSPATIAL 2014].

 

o   Dr. Eduard Dragut: Dr. Dragut was a post-doc at Purdue University during 2012-2013 and participated, in the context of this project, in the crowdsourced indexing paper [DBCrowd 2013].