<html xmlns:v="urn:schemas-microsoft-com:vml"
xmlns:o="urn:schemas-microsoft-com:office:office"
xmlns:w="urn:schemas-microsoft-com:office:word"
xmlns:m="http://schemas.microsoft.com/office/2004/12/omml"
xmlns="http://www.w3.org/TR/REC-html40" xmlns:ns0="http://macVmlSchemaUri">

<head>
<meta http-equiv="Content-Type" content="text/html; charset=utf-8">
<!-- The encoding was previously declared as "unicode", a legacy alias for
     UTF-16LE that browsers remap to UTF-8 when it is found in a meta tag.
     It is now declared as utf-8 explicitly.
     NOTE(review): confirm the file is actually saved as UTF-8 on disk.
     The ProgId, Generator and Originator entries below identify the page as a
     Word document; File-List points at the manifest of supporting files. -->
<meta name="ProgId" content="Word.Document">
<meta name="Generator" content="Microsoft Word 15">
<meta name="Originator" content="Microsoft Word 15">
<link rel="File-List" href="index_files/filelist.xml">
<!-- Office document properties (authors, revision number, created and saved
     timestamps, page/word/character counts) plus the AllowPNG document
     setting. The block sits inside an "if gte mso 9" conditional comment, so
     to an HTML parser it is an ordinary comment and is not rendered. -->
<!--[if gte mso 9]><xml>
 <o:DocumentProperties>
  <o:Author>Walid G Aref</o:Author>
  <o:LastAuthor>Walid G. Aref</o:LastAuthor>
  <o:Revision>18</o:Revision>
  <o:TotalTime>3097</o:TotalTime>
  <o:Created>2018-07-02T23:01:00Z</o:Created>
  <o:LastSaved>2023-12-10T08:20:00Z</o:LastSaved>
  <o:Pages>17</o:Pages>
  <o:Words>9240</o:Words>
  <o:Characters>52673</o:Characters>
  <o:Lines>438</o:Lines>
  <o:Paragraphs>123</o:Paragraphs>
  <o:CharactersWithSpaces>61790</o:CharactersWithSpaces>
  <o:Version>16.00</o:Version>
 </o:DocumentProperties>
 <o:OfficeDocumentSettings>
  <o:AllowPNG/>
 </o:OfficeDocumentSettings>
</xml><![endif]-->
<!-- Theme data and colour-scheme mapping files referenced from the
     index_files/ folder next to this page. -->
<link rel="themeData" href="index_files/themedata.thmx">
<link rel="colorSchemeMapping" href="index_files/colorschememapping.xml">
<!-- Word document settings: view mode (Print) and zoom value, spelling and
     grammar state, change-tracking and schema-validation switches, theme
     language IDs (EN-US, X-NONE, AR-SA), a list of layout compatibility
     flags, the target browser level, and the default math properties
     (m:mathPr, math font "Cambria Math"). Like the other Office data islands
     it is wrapped in an "if gte mso 9" conditional comment. -->
<!--[if gte mso 9]><xml>
 <w:WordDocument>
  <w:View>Print</w:View>
  <w:Zoom>204</w:Zoom>
  <w:SpellingState>Clean</w:SpellingState>
  <w:GrammarState>Clean</w:GrammarState>
  <w:TrackMoves>false</w:TrackMoves>
  <w:TrackFormatting/>
  <w:PunctuationKerning/>
  <w:ValidateAgainstSchemas/>
  <w:SaveIfXMLInvalid>false</w:SaveIfXMLInvalid>
  <w:IgnoreMixedContent>false</w:IgnoreMixedContent>
  <w:AlwaysShowPlaceholderText>false</w:AlwaysShowPlaceholderText>
  <w:DoNotPromoteQF/>
  <w:LidThemeOther>EN-US</w:LidThemeOther>
  <w:LidThemeAsian>X-NONE</w:LidThemeAsian>
  <w:LidThemeComplexScript>AR-SA</w:LidThemeComplexScript>
  <w:Compatibility>
   <w:BreakWrappedTables/>
   <w:SnapToGridInCell/>
   <w:WrapTextWithPunct/>
   <w:UseAsianBreakRules/>
   <w:DontGrowAutofit/>
   <w:SplitPgBreakAndParaMark/>
   <w:EnableOpenTypeKerning/>
   <w:DontFlipMirrorIndents/>
   <w:OverrideTableStyleHps/>
  </w:Compatibility>
  <w:BrowserLevel>MicrosoftInternetExplorer4</w:BrowserLevel>
  <m:mathPr>
   <m:mathFont m:val="Cambria Math"/>
   <m:brkBin m:val="before"/>
   <m:brkBinSub m:val="&#45;-"/>
   <m:smallFrac m:val="off"/>
   <m:dispDef/>
   <m:lMargin m:val="0"/>
   <m:rMargin m:val="0"/>
   <m:defJc m:val="centerGroup"/>
   <m:wrapIndent m:val="1440"/>
   <m:intLim m:val="subSup"/>
   <m:naryLim m:val="undOvr"/>
  </m:mathPr></w:WordDocument>
</xml><![endif]--><!--[if gte mso 9]><xml>
 <w:LatentStyles DefLockedState="false" DefUnhideWhenUsed="false"
  DefSemiHidden="false" DefQFormat="false" DefPriority="99"
  LatentStyleCount="376">
  <w:LsdException Locked="false" Priority="0" QFormat="true" Name="Normal"/>
  <w:LsdException Locked="false" Priority="9" QFormat="true" Name="heading 1"/>
  <w:LsdException Locked="false" Priority="9" SemiHidden="true"
   UnhideWhenUsed="true" QFormat="true" Name="heading 2"/>
  <w:LsdException Locked="false" Priority="9" SemiHidden="true"
   UnhideWhenUsed="true" QFormat="true" Name="heading 3"/>
  <w:LsdException Locked="false" Priority="9" SemiHidden="true"
   UnhideWhenUsed="true" QFormat="true" Name="heading 4"/>
  <w:LsdException Locked="false" Priority="9" SemiHidden="true"
   UnhideWhenUsed="true" QFormat="true" Name="heading 5"/>
  <w:LsdException Locked="false" Priority="9" SemiHidden="true"
   UnhideWhenUsed="true" QFormat="true" Name="heading 6"/>
  <w:LsdException Locked="false" Priority="9" SemiHidden="true"
   UnhideWhenUsed="true" QFormat="true" Name="heading 7"/>
  <w:LsdException Locked="false" Priority="9" SemiHidden="true"
   UnhideWhenUsed="true" QFormat="true" Name="heading 8"/>
  <w:LsdException Locked="false" Priority="9" SemiHidden="true"
   UnhideWhenUsed="true" QFormat="true" Name="heading 9"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="index 1"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="index 2"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="index 3"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="index 4"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="index 5"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="index 6"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="index 7"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="index 8"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="index 9"/>
  <w:LsdException Locked="false" Priority="39" SemiHidden="true"
   UnhideWhenUsed="true" Name="toc 1"/>
  <w:LsdException Locked="false" Priority="39" SemiHidden="true"
   UnhideWhenUsed="true" Name="toc 2"/>
  <w:LsdException Locked="false" Priority="39" SemiHidden="true"
   UnhideWhenUsed="true" Name="toc 3"/>
  <w:LsdException Locked="false" Priority="39" SemiHidden="true"
   UnhideWhenUsed="true" Name="toc 4"/>
  <w:LsdException Locked="false" Priority="39" SemiHidden="true"
   UnhideWhenUsed="true" Name="toc 5"/>
  <w:LsdException Locked="false" Priority="39" SemiHidden="true"
   UnhideWhenUsed="true" Name="toc 6"/>
  <w:LsdException Locked="false" Priority="39" SemiHidden="true"
   UnhideWhenUsed="true" Name="toc 7"/>
  <w:LsdException Locked="false" Priority="39" SemiHidden="true"
   UnhideWhenUsed="true" Name="toc 8"/>
  <w:LsdException Locked="false" Priority="39" SemiHidden="true"
   UnhideWhenUsed="true" Name="toc 9"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="Normal Indent"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="footnote text"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="annotation text"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="header"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="footer"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="index heading"/>
  <w:LsdException Locked="false" Priority="35" SemiHidden="true"
   UnhideWhenUsed="true" QFormat="true" Name="caption"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="table of figures"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="envelope address"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="envelope return"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="footnote reference"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="annotation reference"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="line number"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="page number"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="endnote reference"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="endnote text"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="table of authorities"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="macro"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="toa heading"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="List"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="List Bullet"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="List Number"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="List 2"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="List 3"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="List 4"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="List 5"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="List Bullet 2"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="List Bullet 3"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="List Bullet 4"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="List Bullet 5"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="List Number 2"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="List Number 3"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="List Number 4"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="List Number 5"/>
  <w:LsdException Locked="false" Priority="10" QFormat="true" Name="Title"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="Closing"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="Signature"/>
  <w:LsdException Locked="false" Priority="1" SemiHidden="true"
   UnhideWhenUsed="true" Name="Default Paragraph Font"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="Body Text"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="Body Text Indent"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="List Continue"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="List Continue 2"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="List Continue 3"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="List Continue 4"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="List Continue 5"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="Message Header"/>
  <w:LsdException Locked="false" Priority="11" QFormat="true" Name="Subtitle"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="Salutation"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="Date"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="Body Text First Indent"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="Body Text First Indent 2"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="Note Heading"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="Body Text 2"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="Body Text 3"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="Body Text Indent 2"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="Body Text Indent 3"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="Block Text"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="Hyperlink"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="FollowedHyperlink"/>
  <w:LsdException Locked="false" Priority="22" QFormat="true" Name="Strong"/>
  <w:LsdException Locked="false" Priority="20" QFormat="true" Name="Emphasis"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="Document Map"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="Plain Text"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="E-mail Signature"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="HTML Top of Form"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="HTML Bottom of Form"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="Normal (Web)"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="HTML Acronym"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="HTML Address"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="HTML Cite"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="HTML Code"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="HTML Definition"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="HTML Keyboard"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="HTML Preformatted"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="HTML Sample"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="HTML Typewriter"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="HTML Variable"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="Normal Table"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="annotation subject"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="No List"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="Outline List 1"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="Outline List 2"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="Outline List 3"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="Table Simple 1"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="Table Simple 2"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="Table Simple 3"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="Table Classic 1"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="Table Classic 2"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="Table Classic 3"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="Table Classic 4"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="Table Colorful 1"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="Table Colorful 2"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="Table Colorful 3"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="Table Columns 1"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="Table Columns 2"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="Table Columns 3"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="Table Columns 4"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="Table Columns 5"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="Table Grid 1"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="Table Grid 2"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="Table Grid 3"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="Table Grid 4"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="Table Grid 5"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="Table Grid 6"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="Table Grid 7"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="Table Grid 8"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="Table List 1"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="Table List 2"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="Table List 3"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="Table List 4"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="Table List 5"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="Table List 6"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="Table List 7"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="Table List 8"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="Table 3D effects 1"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="Table 3D effects 2"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="Table 3D effects 3"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="Table Contemporary"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="Table Elegant"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="Table Professional"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="Table Subtle 1"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="Table Subtle 2"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="Table Web 1"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="Table Web 2"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="Table Web 3"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="Balloon Text"/>
  <w:LsdException Locked="false" Priority="39" Name="Table Grid"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="Table Theme"/>
  <w:LsdException Locked="false" SemiHidden="true" Name="Placeholder Text"/>
  <w:LsdException Locked="false" Priority="1" QFormat="true" Name="No Spacing"/>
  <w:LsdException Locked="false" Priority="60" Name="Light Shading"/>
  <w:LsdException Locked="false" Priority="61" Name="Light List"/>
  <w:LsdException Locked="false" Priority="62" Name="Light Grid"/>
  <w:LsdException Locked="false" Priority="63" Name="Medium Shading 1"/>
  <w:LsdException Locked="false" Priority="64" Name="Medium Shading 2"/>
  <w:LsdException Locked="false" Priority="65" Name="Medium List 1"/>
  <w:LsdException Locked="false" Priority="66" Name="Medium List 2"/>
  <w:LsdException Locked="false" Priority="67" Name="Medium Grid 1"/>
  <w:LsdException Locked="false" Priority="68" Name="Medium Grid 2"/>
  <w:LsdException Locked="false" Priority="69" Name="Medium Grid 3"/>
  <w:LsdException Locked="false" Priority="70" Name="Dark List"/>
  <w:LsdException Locked="false" Priority="71" Name="Colorful Shading"/>
  <w:LsdException Locked="false" Priority="72" Name="Colorful List"/>
  <w:LsdException Locked="false" Priority="73" Name="Colorful Grid"/>
  <w:LsdException Locked="false" Priority="60" Name="Light Shading Accent 1"/>
  <w:LsdException Locked="false" Priority="61" Name="Light List Accent 1"/>
  <w:LsdException Locked="false" Priority="62" Name="Light Grid Accent 1"/>
  <w:LsdException Locked="false" Priority="63" Name="Medium Shading 1 Accent 1"/>
  <w:LsdException Locked="false" Priority="64" Name="Medium Shading 2 Accent 1"/>
  <w:LsdException Locked="false" Priority="65" Name="Medium List 1 Accent 1"/>
  <w:LsdException Locked="false" SemiHidden="true" Name="Revision"/>
  <w:LsdException Locked="false" Priority="34" QFormat="true"
   Name="List Paragraph"/>
  <w:LsdException Locked="false" Priority="29" QFormat="true" Name="Quote"/>
  <w:LsdException Locked="false" Priority="30" QFormat="true"
   Name="Intense Quote"/>
  <w:LsdException Locked="false" Priority="66" Name="Medium List 2 Accent 1"/>
  <w:LsdException Locked="false" Priority="67" Name="Medium Grid 1 Accent 1"/>
  <w:LsdException Locked="false" Priority="68" Name="Medium Grid 2 Accent 1"/>
  <w:LsdException Locked="false" Priority="69" Name="Medium Grid 3 Accent 1"/>
  <w:LsdException Locked="false" Priority="70" Name="Dark List Accent 1"/>
  <w:LsdException Locked="false" Priority="71" Name="Colorful Shading Accent 1"/>
  <w:LsdException Locked="false" Priority="72" Name="Colorful List Accent 1"/>
  <w:LsdException Locked="false" Priority="73" Name="Colorful Grid Accent 1"/>
  <w:LsdException Locked="false" Priority="60" Name="Light Shading Accent 2"/>
  <w:LsdException Locked="false" Priority="61" Name="Light List Accent 2"/>
  <w:LsdException Locked="false" Priority="62" Name="Light Grid Accent 2"/>
  <w:LsdException Locked="false" Priority="63" Name="Medium Shading 1 Accent 2"/>
  <w:LsdException Locked="false" Priority="64" Name="Medium Shading 2 Accent 2"/>
  <w:LsdException Locked="false" Priority="65" Name="Medium List 1 Accent 2"/>
  <w:LsdException Locked="false" Priority="66" Name="Medium List 2 Accent 2"/>
  <w:LsdException Locked="false" Priority="67" Name="Medium Grid 1 Accent 2"/>
  <w:LsdException Locked="false" Priority="68" Name="Medium Grid 2 Accent 2"/>
  <w:LsdException Locked="false" Priority="69" Name="Medium Grid 3 Accent 2"/>
  <w:LsdException Locked="false" Priority="70" Name="Dark List Accent 2"/>
  <w:LsdException Locked="false" Priority="71" Name="Colorful Shading Accent 2"/>
  <w:LsdException Locked="false" Priority="72" Name="Colorful List Accent 2"/>
  <w:LsdException Locked="false" Priority="73" Name="Colorful Grid Accent 2"/>
  <w:LsdException Locked="false" Priority="60" Name="Light Shading Accent 3"/>
  <w:LsdException Locked="false" Priority="61" Name="Light List Accent 3"/>
  <w:LsdException Locked="false" Priority="62" Name="Light Grid Accent 3"/>
  <w:LsdException Locked="false" Priority="63" Name="Medium Shading 1 Accent 3"/>
  <w:LsdException Locked="false" Priority="64" Name="Medium Shading 2 Accent 3"/>
  <w:LsdException Locked="false" Priority="65" Name="Medium List 1 Accent 3"/>
  <w:LsdException Locked="false" Priority="66" Name="Medium List 2 Accent 3"/>
  <w:LsdException Locked="false" Priority="67" Name="Medium Grid 1 Accent 3"/>
  <w:LsdException Locked="false" Priority="68" Name="Medium Grid 2 Accent 3"/>
  <w:LsdException Locked="false" Priority="69" Name="Medium Grid 3 Accent 3"/>
  <w:LsdException Locked="false" Priority="70" Name="Dark List Accent 3"/>
  <w:LsdException Locked="false" Priority="71" Name="Colorful Shading Accent 3"/>
  <w:LsdException Locked="false" Priority="72" Name="Colorful List Accent 3"/>
  <w:LsdException Locked="false" Priority="73" Name="Colorful Grid Accent 3"/>
  <w:LsdException Locked="false" Priority="60" Name="Light Shading Accent 4"/>
  <w:LsdException Locked="false" Priority="61" Name="Light List Accent 4"/>
  <w:LsdException Locked="false" Priority="62" Name="Light Grid Accent 4"/>
  <w:LsdException Locked="false" Priority="63" Name="Medium Shading 1 Accent 4"/>
  <w:LsdException Locked="false" Priority="64" Name="Medium Shading 2 Accent 4"/>
  <w:LsdException Locked="false" Priority="65" Name="Medium List 1 Accent 4"/>
  <w:LsdException Locked="false" Priority="66" Name="Medium List 2 Accent 4"/>
  <w:LsdException Locked="false" Priority="67" Name="Medium Grid 1 Accent 4"/>
  <w:LsdException Locked="false" Priority="68" Name="Medium Grid 2 Accent 4"/>
  <w:LsdException Locked="false" Priority="69" Name="Medium Grid 3 Accent 4"/>
  <w:LsdException Locked="false" Priority="70" Name="Dark List Accent 4"/>
  <w:LsdException Locked="false" Priority="71" Name="Colorful Shading Accent 4"/>
  <w:LsdException Locked="false" Priority="72" Name="Colorful List Accent 4"/>
  <w:LsdException Locked="false" Priority="73" Name="Colorful Grid Accent 4"/>
  <w:LsdException Locked="false" Priority="60" Name="Light Shading Accent 5"/>
  <w:LsdException Locked="false" Priority="61" Name="Light List Accent 5"/>
  <w:LsdException Locked="false" Priority="62" Name="Light Grid Accent 5"/>
  <w:LsdException Locked="false" Priority="63" Name="Medium Shading 1 Accent 5"/>
  <w:LsdException Locked="false" Priority="64" Name="Medium Shading 2 Accent 5"/>
  <w:LsdException Locked="false" Priority="65" Name="Medium List 1 Accent 5"/>
  <w:LsdException Locked="false" Priority="66" Name="Medium List 2 Accent 5"/>
  <w:LsdException Locked="false" Priority="67" Name="Medium Grid 1 Accent 5"/>
  <w:LsdException Locked="false" Priority="68" Name="Medium Grid 2 Accent 5"/>
  <w:LsdException Locked="false" Priority="69" Name="Medium Grid 3 Accent 5"/>
  <w:LsdException Locked="false" Priority="70" Name="Dark List Accent 5"/>
  <w:LsdException Locked="false" Priority="71" Name="Colorful Shading Accent 5"/>
  <w:LsdException Locked="false" Priority="72" Name="Colorful List Accent 5"/>
  <w:LsdException Locked="false" Priority="73" Name="Colorful Grid Accent 5"/>
  <w:LsdException Locked="false" Priority="60" Name="Light Shading Accent 6"/>
  <w:LsdException Locked="false" Priority="61" Name="Light List Accent 6"/>
  <w:LsdException Locked="false" Priority="62" Name="Light Grid Accent 6"/>
  <w:LsdException Locked="false" Priority="63" Name="Medium Shading 1 Accent 6"/>
  <w:LsdException Locked="false" Priority="64" Name="Medium Shading 2 Accent 6"/>
  <w:LsdException Locked="false" Priority="65" Name="Medium List 1 Accent 6"/>
  <w:LsdException Locked="false" Priority="66" Name="Medium List 2 Accent 6"/>
  <w:LsdException Locked="false" Priority="67" Name="Medium Grid 1 Accent 6"/>
  <w:LsdException Locked="false" Priority="68" Name="Medium Grid 2 Accent 6"/>
  <w:LsdException Locked="false" Priority="69" Name="Medium Grid 3 Accent 6"/>
  <w:LsdException Locked="false" Priority="70" Name="Dark List Accent 6"/>
  <w:LsdException Locked="false" Priority="71" Name="Colorful Shading Accent 6"/>
  <w:LsdException Locked="false" Priority="72" Name="Colorful List Accent 6"/>
  <w:LsdException Locked="false" Priority="73" Name="Colorful Grid Accent 6"/>
  <w:LsdException Locked="false" Priority="19" QFormat="true"
   Name="Subtle Emphasis"/>
  <w:LsdException Locked="false" Priority="21" QFormat="true"
   Name="Intense Emphasis"/>
  <w:LsdException Locked="false" Priority="31" QFormat="true"
   Name="Subtle Reference"/>
  <w:LsdException Locked="false" Priority="32" QFormat="true"
   Name="Intense Reference"/>
  <w:LsdException Locked="false" Priority="33" QFormat="true" Name="Book Title"/>
  <w:LsdException Locked="false" Priority="37" SemiHidden="true"
   UnhideWhenUsed="true" Name="Bibliography"/>
  <w:LsdException Locked="false" Priority="39" SemiHidden="true"
   UnhideWhenUsed="true" QFormat="true" Name="TOC Heading"/>
  <w:LsdException Locked="false" Priority="49" Name="Grid Table 4"/>
  <w:LsdException Locked="false" Priority="50" Name="Grid Table 5 Dark"/>
  <w:LsdException Locked="false" Priority="51" Name="Grid Table 6 Colorful"/>
  <w:LsdException Locked="false" Priority="52" Name="Grid Table 7 Colorful"/>
  <w:LsdException Locked="false" Priority="46"
   Name="Grid Table 1 Light Accent 1"/>
  <w:LsdException Locked="false" Priority="47" Name="Grid Table 2 Accent 1"/>
  <w:LsdException Locked="false" Priority="48" Name="Grid Table 3 Accent 1"/>
  <w:LsdException Locked="false" Priority="49" Name="Grid Table 4 Accent 1"/>
  <w:LsdException Locked="false" Priority="50" Name="Grid Table 5 Dark Accent 1"/>
  <w:LsdException Locked="false" Priority="51"
   Name="Grid Table 6 Colorful Accent 1"/>
  <w:LsdException Locked="false" Priority="52"
   Name="Grid Table 7 Colorful Accent 1"/>
  <w:LsdException Locked="false" Priority="46"
   Name="Grid Table 1 Light Accent 2"/>
  <w:LsdException Locked="false" Priority="47" Name="Grid Table 2 Accent 2"/>
  <w:LsdException Locked="false" Priority="48" Name="Grid Table 3 Accent 2"/>
  <w:LsdException Locked="false" Priority="49" Name="Grid Table 4 Accent 2"/>
  <w:LsdException Locked="false" Priority="50" Name="Grid Table 5 Dark Accent 2"/>
  <w:LsdException Locked="false" Priority="51"
   Name="Grid Table 6 Colorful Accent 2"/>
  <w:LsdException Locked="false" Priority="52"
   Name="Grid Table 7 Colorful Accent 2"/>
  <w:LsdException Locked="false" Priority="46"
   Name="Grid Table 1 Light Accent 3"/>
  <w:LsdException Locked="false" Priority="47" Name="Grid Table 2 Accent 3"/>
  <w:LsdException Locked="false" Priority="48" Name="Grid Table 3 Accent 3"/>
  <w:LsdException Locked="false" Priority="49" Name="Grid Table 4 Accent 3"/>
  <w:LsdException Locked="false" Priority="50" Name="Grid Table 5 Dark Accent 3"/>
  <w:LsdException Locked="false" Priority="51"
   Name="Grid Table 6 Colorful Accent 3"/>
  <w:LsdException Locked="false" Priority="52"
   Name="Grid Table 7 Colorful Accent 3"/>
  <w:LsdException Locked="false" Priority="46"
   Name="Grid Table 1 Light Accent 4"/>
  <w:LsdException Locked="false" Priority="47" Name="Grid Table 2 Accent 4"/>
  <w:LsdException Locked="false" Priority="48" Name="Grid Table 3 Accent 4"/>
  <w:LsdException Locked="false" Priority="49" Name="Grid Table 4 Accent 4"/>
  <w:LsdException Locked="false" Priority="50" Name="Grid Table 5 Dark Accent 4"/>
  <w:LsdException Locked="false" Priority="51"
   Name="Grid Table 6 Colorful Accent 4"/>
  <w:LsdException Locked="false" Priority="52"
   Name="Grid Table 7 Colorful Accent 4"/>
  <w:LsdException Locked="false" Priority="46"
   Name="Grid Table 1 Light Accent 5"/>
  <w:LsdException Locked="false" Priority="47" Name="Grid Table 2 Accent 5"/>
  <w:LsdException Locked="false" Priority="48" Name="Grid Table 3 Accent 5"/>
  <w:LsdException Locked="false" Priority="49" Name="Grid Table 4 Accent 5"/>
  <w:LsdException Locked="false" Priority="50" Name="Grid Table 5 Dark Accent 5"/>
  <w:LsdException Locked="false" Priority="51"
   Name="Grid Table 6 Colorful Accent 5"/>
  <w:LsdException Locked="false" Priority="52"
   Name="Grid Table 7 Colorful Accent 5"/>
  <w:LsdException Locked="false" Priority="46"
   Name="Grid Table 1 Light Accent 6"/>
  <w:LsdException Locked="false" Priority="47" Name="Grid Table 2 Accent 6"/>
  <w:LsdException Locked="false" Priority="48" Name="Grid Table 3 Accent 6"/>
  <w:LsdException Locked="false" Priority="49" Name="Grid Table 4 Accent 6"/>
  <w:LsdException Locked="false" Priority="50" Name="Grid Table 5 Dark Accent 6"/>
  <w:LsdException Locked="false" Priority="51"
   Name="Grid Table 6 Colorful Accent 6"/>
  <w:LsdException Locked="false" Priority="52"
   Name="Grid Table 7 Colorful Accent 6"/>
  <w:LsdException Locked="false" Priority="46" Name="List Table 1 Light"/>
  <w:LsdException Locked="false" Priority="47" Name="List Table 2"/>
  <w:LsdException Locked="false" Priority="48" Name="List Table 3"/>
  <w:LsdException Locked="false" Priority="49" Name="List Table 4"/>
  <w:LsdException Locked="false" Priority="50" Name="List Table 5 Dark"/>
  <w:LsdException Locked="false" Priority="51" Name="List Table 6 Colorful"/>
  <w:LsdException Locked="false" Priority="52" Name="List Table 7 Colorful"/>
  <w:LsdException Locked="false" Priority="46"
   Name="List Table 1 Light Accent 1"/>
  <w:LsdException Locked="false" Priority="47" Name="List Table 2 Accent 1"/>
  <w:LsdException Locked="false" Priority="48" Name="List Table 3 Accent 1"/>
  <w:LsdException Locked="false" Priority="49" Name="List Table 4 Accent 1"/>
  <w:LsdException Locked="false" Priority="50" Name="List Table 5 Dark Accent 1"/>
  <w:LsdException Locked="false" Priority="51"
   Name="List Table 6 Colorful Accent 1"/>
  <w:LsdException Locked="false" Priority="52"
   Name="List Table 7 Colorful Accent 1"/>
  <w:LsdException Locked="false" Priority="46"
   Name="List Table 1 Light Accent 2"/>
  <w:LsdException Locked="false" Priority="47" Name="List Table 2 Accent 2"/>
  <w:LsdException Locked="false" Priority="48" Name="List Table 3 Accent 2"/>
  <w:LsdException Locked="false" Priority="49" Name="List Table 4 Accent 2"/>
  <w:LsdException Locked="false" Priority="50" Name="List Table 5 Dark Accent 2"/>
  <w:LsdException Locked="false" Priority="51"
   Name="List Table 6 Colorful Accent 2"/>
  <w:LsdException Locked="false" Priority="52"
   Name="List Table 7 Colorful Accent 2"/>
  <w:LsdException Locked="false" Priority="46"
   Name="List Table 1 Light Accent 3"/>
  <w:LsdException Locked="false" Priority="47" Name="List Table 2 Accent 3"/>
  <w:LsdException Locked="false" Priority="48" Name="List Table 3 Accent 3"/>
  <w:LsdException Locked="false" Priority="49" Name="List Table 4 Accent 3"/>
  <w:LsdException Locked="false" Priority="50" Name="List Table 5 Dark Accent 3"/>
  <w:LsdException Locked="false" Priority="51"
   Name="List Table 6 Colorful Accent 3"/>
  <w:LsdException Locked="false" Priority="52"
   Name="List Table 7 Colorful Accent 3"/>
  <w:LsdException Locked="false" Priority="46"
   Name="List Table 1 Light Accent 4"/>
  <w:LsdException Locked="false" Priority="47" Name="List Table 2 Accent 4"/>
  <w:LsdException Locked="false" Priority="48" Name="List Table 3 Accent 4"/>
  <w:LsdException Locked="false" Priority="49" Name="List Table 4 Accent 4"/>
  <w:LsdException Locked="false" Priority="50" Name="List Table 5 Dark Accent 4"/>
  <w:LsdException Locked="false" Priority="51"
   Name="List Table 6 Colorful Accent 4"/>
  <w:LsdException Locked="false" Priority="52"
   Name="List Table 7 Colorful Accent 4"/>
  <w:LsdException Locked="false" Priority="46"
   Name="List Table 1 Light Accent 5"/>
  <w:LsdException Locked="false" Priority="47" Name="List Table 2 Accent 5"/>
  <w:LsdException Locked="false" Priority="48" Name="List Table 3 Accent 5"/>
  <w:LsdException Locked="false" Priority="49" Name="List Table 4 Accent 5"/>
  <w:LsdException Locked="false" Priority="50" Name="List Table 5 Dark Accent 5"/>
  <w:LsdException Locked="false" Priority="51"
   Name="List Table 6 Colorful Accent 5"/>
  <w:LsdException Locked="false" Priority="52"
   Name="List Table 7 Colorful Accent 5"/>
  <w:LsdException Locked="false" Priority="46"
   Name="List Table 1 Light Accent 6"/>
  <w:LsdException Locked="false" Priority="47" Name="List Table 2 Accent 6"/>
  <w:LsdException Locked="false" Priority="48" Name="List Table 3 Accent 6"/>
  <w:LsdException Locked="false" Priority="49" Name="List Table 4 Accent 6"/>
  <w:LsdException Locked="false" Priority="50" Name="List Table 5 Dark Accent 6"/>
  <w:LsdException Locked="false" Priority="51"
   Name="List Table 6 Colorful Accent 6"/>
  <w:LsdException Locked="false" Priority="52"
   Name="List Table 7 Colorful Accent 6"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="Mention"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="Smart Hyperlink"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="Hashtag"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="Unresolved Mention"/>
  <w:LsdException Locked="false" SemiHidden="true" UnhideWhenUsed="true"
   Name="Smart Link"/>
 </w:LatentStyles>
</xml><![endif]-->
<style>
<!--
 /* Font Definitions */
 @font-face
	{font-family:Wingdings;
	panose-1:5 0 0 0 0 0 0 0 0 0;
	mso-font-charset:77;
	mso-generic-font-family:decorative;
	mso-font-pitch:variable;
	mso-font-signature:3 0 0 0 -2147483647 0;}
@font-face
	{font-family:"Cambria Math";
	panose-1:2 4 5 3 5 4 6 3 2 4;
	mso-font-charset:0;
	mso-generic-font-family:roman;
	mso-font-pitch:variable;
	mso-font-signature:-536870145 1107305727 0 0 415 0;}
@font-face
	{font-family:Calibri;
	panose-1:2 15 5 2 2 2 4 3 2 4;
	mso-font-charset:0;
	mso-generic-font-family:swiss;
	mso-font-pitch:variable;
	mso-font-signature:-536859905 -1073732485 9 0 511 0;}
 /* Style Definitions */
 p.MsoNormal, li.MsoNormal, div.MsoNormal
	{mso-style-unhide:no;
	mso-style-qformat:yes;
	mso-style-parent:"";
	margin:0in;
	mso-pagination:widow-orphan;
	font-size:12.0pt;
	font-family:"Calibri",sans-serif;
	mso-ascii-font-family:Calibri;
	mso-ascii-theme-font:minor-latin;
	mso-fareast-font-family:Calibri;
	mso-fareast-theme-font:minor-latin;
	mso-hansi-font-family:Calibri;
	mso-hansi-theme-font:minor-latin;
	mso-bidi-font-family:"Times New Roman";
	mso-bidi-theme-font:minor-bidi;}
a:link, span.MsoHyperlink
	{mso-style-priority:99;
	color:blue;
	text-decoration:underline;
	text-underline:single;}
a:visited, span.MsoHyperlinkFollowed
	{mso-style-noshow:yes;
	mso-style-priority:99;
	color:#954F72;
	mso-themecolor:followedhyperlink;
	text-decoration:underline;
	text-underline:single;}
p
	{mso-style-noshow:yes;
	mso-style-priority:99;
	mso-margin-top-alt:auto;
	margin-right:0in;
	mso-margin-bottom-alt:auto;
	margin-left:0in;
	mso-pagination:widow-orphan;
	font-size:12.0pt;
	font-family:"Times New Roman",serif;
	mso-fareast-font-family:"Times New Roman";}
p.MsoListParagraph, li.MsoListParagraph, div.MsoListParagraph
	{mso-style-noshow:yes;
	mso-style-priority:34;
	mso-style-unhide:no;
	mso-style-qformat:yes;
	margin-top:0in;
	margin-right:0in;
	margin-bottom:0in;
	margin-left:.5in;
	mso-add-space:auto;
	mso-pagination:widow-orphan;
	font-size:12.0pt;
	font-family:"Calibri",sans-serif;
	mso-ascii-font-family:Calibri;
	mso-ascii-theme-font:minor-latin;
	mso-fareast-font-family:Calibri;
	mso-fareast-theme-font:minor-latin;
	mso-hansi-font-family:Calibri;
	mso-hansi-theme-font:minor-latin;
	mso-bidi-font-family:"Times New Roman";
	mso-bidi-theme-font:minor-bidi;}
p.MsoListParagraphCxSpFirst, li.MsoListParagraphCxSpFirst, div.MsoListParagraphCxSpFirst
	{mso-style-noshow:yes;
	mso-style-priority:34;
	mso-style-unhide:no;
	mso-style-qformat:yes;
	mso-style-type:export-only;
	margin-top:0in;
	margin-right:0in;
	margin-bottom:0in;
	margin-left:.5in;
	mso-add-space:auto;
	mso-pagination:widow-orphan;
	font-size:12.0pt;
	font-family:"Calibri",sans-serif;
	mso-ascii-font-family:Calibri;
	mso-ascii-theme-font:minor-latin;
	mso-fareast-font-family:Calibri;
	mso-fareast-theme-font:minor-latin;
	mso-hansi-font-family:Calibri;
	mso-hansi-theme-font:minor-latin;
	mso-bidi-font-family:"Times New Roman";
	mso-bidi-theme-font:minor-bidi;}
p.MsoListParagraphCxSpMiddle, li.MsoListParagraphCxSpMiddle, div.MsoListParagraphCxSpMiddle
	{mso-style-noshow:yes;
	mso-style-priority:34;
	mso-style-unhide:no;
	mso-style-qformat:yes;
	mso-style-type:export-only;
	margin-top:0in;
	margin-right:0in;
	margin-bottom:0in;
	margin-left:.5in;
	mso-add-space:auto;
	mso-pagination:widow-orphan;
	font-size:12.0pt;
	font-family:"Calibri",sans-serif;
	mso-ascii-font-family:Calibri;
	mso-ascii-theme-font:minor-latin;
	mso-fareast-font-family:Calibri;
	mso-fareast-theme-font:minor-latin;
	mso-hansi-font-family:Calibri;
	mso-hansi-theme-font:minor-latin;
	mso-bidi-font-family:"Times New Roman";
	mso-bidi-theme-font:minor-bidi;}
p.MsoListParagraphCxSpLast, li.MsoListParagraphCxSpLast, div.MsoListParagraphCxSpLast
	{mso-style-noshow:yes;
	mso-style-priority:34;
	mso-style-unhide:no;
	mso-style-qformat:yes;
	mso-style-type:export-only;
	margin-top:0in;
	margin-right:0in;
	margin-bottom:0in;
	margin-left:.5in;
	mso-add-space:auto;
	mso-pagination:widow-orphan;
	font-size:12.0pt;
	font-family:"Calibri",sans-serif;
	mso-ascii-font-family:Calibri;
	mso-ascii-theme-font:minor-latin;
	mso-fareast-font-family:Calibri;
	mso-fareast-theme-font:minor-latin;
	mso-hansi-font-family:Calibri;
	mso-hansi-theme-font:minor-latin;
	mso-bidi-font-family:"Times New Roman";
	mso-bidi-theme-font:minor-bidi;}
p.msonormal0, li.msonormal0, div.msonormal0
	{mso-style-name:msonormal;
	mso-style-noshow:yes;
	mso-style-priority:99;
	mso-style-unhide:no;
	mso-margin-top-alt:auto;
	margin-right:0in;
	mso-margin-bottom-alt:auto;
	margin-left:0in;
	mso-pagination:widow-orphan;
	font-size:12.0pt;
	font-family:"Times New Roman",serif;
	mso-fareast-font-family:"Times New Roman";
	mso-fareast-theme-font:minor-fareast;}
p.Default, li.Default, div.Default
	{mso-style-name:Default;
	mso-style-noshow:yes;
	mso-style-priority:99;
	mso-style-unhide:no;
	mso-style-parent:"";
	margin:0in;
	mso-pagination:none;
	mso-layout-grid-align:none;
	text-autospace:none;
	font-size:12.0pt;
	font-family:"Arial",sans-serif;
	mso-fareast-font-family:Calibri;
	mso-fareast-theme-font:minor-latin;
	color:black;}
span.notereqd
	{mso-style-name:notereqd;
	mso-style-unhide:no;}
span.SpellE
	{mso-style-name:"";
	mso-spl-e:yes;}
span.GramE
	{mso-style-name:"";
	mso-gram-e:yes;}
.MsoChpDefault
	{mso-style-type:export-only;
	mso-default-props:yes;
	font-size:10.0pt;
	mso-ansi-font-size:10.0pt;
	mso-bidi-font-size:10.0pt;
	font-family:"Calibri",sans-serif;
	mso-ascii-font-family:Calibri;
	mso-ascii-theme-font:minor-latin;
	mso-fareast-font-family:Calibri;
	mso-fareast-theme-font:minor-latin;
	mso-hansi-font-family:Calibri;
	mso-hansi-theme-font:minor-latin;
	mso-bidi-font-family:"Times New Roman";
	mso-bidi-theme-font:minor-bidi;
	mso-font-kerning:0pt;
	mso-ligatures:none;}
@page WordSection1
	{size:8.5in 11.0in;
	margin:1.0in 1.0in 1.0in 1.0in;
	mso-header-margin:.5in;
	mso-footer-margin:.5in;
	mso-paper-source:0;}
div.WordSection1
	{page:WordSection1;}
 /* List Definitions */
 @list l0
	{mso-list-id:1901331129;
	mso-list-type:hybrid;
	mso-list-template-ids:677944108 67698703 -1 -1 -1 -1 -1 -1 -1 -1;}
@list l0:level1
	{mso-level-tab-stop:none;
	mso-level-number-position:left;
	text-indent:-.25in;}
@list l0:level2
	{mso-level-number-format:bullet;
	mso-level-text:o;
	mso-level-tab-stop:none;
	mso-level-number-position:left;
	text-indent:-.25in;
	font-family:"Courier New";}
@list l0:level3
	{mso-level-number-format:bullet;
	mso-level-text:;
	mso-level-tab-stop:none;
	mso-level-number-position:left;
	text-indent:-.25in;
	font-family:Wingdings;}
@list l0:level4
	{mso-level-number-format:bullet;
	mso-level-text:;
	mso-level-tab-stop:none;
	mso-level-number-position:left;
	text-indent:-.25in;
	font-family:Symbol;}
@list l0:level5
	{mso-level-number-format:bullet;
	mso-level-text:o;
	mso-level-tab-stop:none;
	mso-level-number-position:left;
	text-indent:-.25in;
	font-family:"Courier New";}
@list l0:level6
	{mso-level-number-format:bullet;
	mso-level-text:;
	mso-level-tab-stop:none;
	mso-level-number-position:left;
	text-indent:-.25in;
	font-family:Wingdings;}
@list l0:level7
	{mso-level-number-format:bullet;
	mso-level-text:;
	mso-level-tab-stop:none;
	mso-level-number-position:left;
	text-indent:-.25in;
	font-family:Symbol;}
@list l0:level8
	{mso-level-number-format:bullet;
	mso-level-text:o;
	mso-level-tab-stop:none;
	mso-level-number-position:left;
	text-indent:-.25in;
	font-family:"Courier New";}
@list l0:level9
	{mso-level-number-format:bullet;
	mso-level-text:;
	mso-level-tab-stop:none;
	mso-level-number-position:left;
	text-indent:-.25in;
	font-family:Wingdings;}
@list l1
	{mso-list-id:2001153537;
	mso-list-type:hybrid;
	mso-list-template-ids:867879558 67698689 67698691 67698693 67698689 67698691 67698693 67698689 67698691 67698693;}
@list l1:level1
	{mso-level-number-format:bullet;
	mso-level-text:;
	mso-level-tab-stop:none;
	mso-level-number-position:left;
	text-indent:-.25in;
	font-family:Symbol;}
@list l1:level2
	{mso-level-number-format:bullet;
	mso-level-text:o;
	mso-level-tab-stop:none;
	mso-level-number-position:left;
	text-indent:-.25in;
	font-family:"Courier New";}
@list l1:level3
	{mso-level-number-format:bullet;
	mso-level-text:;
	mso-level-tab-stop:none;
	mso-level-number-position:left;
	text-indent:-.25in;
	font-family:Wingdings;}
@list l1:level4
	{mso-level-number-format:bullet;
	mso-level-text:;
	mso-level-tab-stop:none;
	mso-level-number-position:left;
	text-indent:-.25in;
	font-family:Symbol;}
@list l1:level5
	{mso-level-number-format:bullet;
	mso-level-text:o;
	mso-level-tab-stop:none;
	mso-level-number-position:left;
	text-indent:-.25in;
	font-family:"Courier New";}
@list l1:level6
	{mso-level-number-format:bullet;
	mso-level-text:;
	mso-level-tab-stop:none;
	mso-level-number-position:left;
	text-indent:-.25in;
	font-family:Wingdings;}
@list l1:level7
	{mso-level-number-format:bullet;
	mso-level-text:;
	mso-level-tab-stop:none;
	mso-level-number-position:left;
	text-indent:-.25in;
	font-family:Symbol;}
@list l1:level8
	{mso-level-number-format:bullet;
	mso-level-text:o;
	mso-level-tab-stop:none;
	mso-level-number-position:left;
	text-indent:-.25in;
	font-family:"Courier New";}
@list l1:level9
	{mso-level-number-format:bullet;
	mso-level-text:;
	mso-level-tab-stop:none;
	mso-level-number-position:left;
	text-indent:-.25in;
	font-family:Wingdings;}
@list l2
	{mso-list-id:2132090378;
	mso-list-type:hybrid;
	mso-list-template-ids:677944108 -1 -1 -1 -1 -1 -1 -1 -1 -1;}
@list l2:level1
	{mso-level-tab-stop:none;
	mso-level-number-position:left;
	text-indent:-.25in;}
@list l2:level2
	{mso-level-number-format:bullet;
	mso-level-text:o;
	mso-level-tab-stop:none;
	mso-level-number-position:left;
	text-indent:-.25in;
	font-family:"Courier New";}
@list l2:level3
	{mso-level-number-format:bullet;
	mso-level-text:;
	mso-level-tab-stop:none;
	mso-level-number-position:left;
	text-indent:-.25in;
	font-family:Wingdings;}
@list l2:level4
	{mso-level-number-format:bullet;
	mso-level-text:;
	mso-level-tab-stop:none;
	mso-level-number-position:left;
	text-indent:-.25in;
	font-family:Symbol;}
@list l2:level5
	{mso-level-number-format:bullet;
	mso-level-text:o;
	mso-level-tab-stop:none;
	mso-level-number-position:left;
	text-indent:-.25in;
	font-family:"Courier New";}
@list l2:level6
	{mso-level-number-format:bullet;
	mso-level-text:;
	mso-level-tab-stop:none;
	mso-level-number-position:left;
	text-indent:-.25in;
	font-family:Wingdings;}
@list l2:level7
	{mso-level-number-format:bullet;
	mso-level-text:;
	mso-level-tab-stop:none;
	mso-level-number-position:left;
	text-indent:-.25in;
	font-family:Symbol;}
@list l2:level8
	{mso-level-number-format:bullet;
	mso-level-text:o;
	mso-level-tab-stop:none;
	mso-level-number-position:left;
	text-indent:-.25in;
	font-family:"Courier New";}
@list l2:level9
	{mso-level-number-format:bullet;
	mso-level-text:;
	mso-level-tab-stop:none;
	mso-level-number-position:left;
	text-indent:-.25in;
	font-family:Wingdings;}
ol
	{margin-bottom:0in;}
ul
	{margin-bottom:0in;}
-->
</style>
<!--[if gte mso 10]>
<style>
 /* Style Definitions */
 table.MsoNormalTable
	{mso-style-name:"Table Normal";
	mso-tstyle-rowband-size:0;
	mso-tstyle-colband-size:0;
	mso-style-noshow:yes;
	mso-style-priority:99;
	mso-style-parent:"";
	mso-padding-alt:0in 5.4pt 0in 5.4pt;
	mso-para-margin:0in;
	mso-pagination:widow-orphan;
	font-size:10.0pt;
	font-family:"Calibri",sans-serif;
	mso-ascii-font-family:Calibri;
	mso-ascii-theme-font:minor-latin;
	mso-hansi-font-family:Calibri;
	mso-hansi-theme-font:minor-latin;
	mso-bidi-font-family:"Times New Roman";
	mso-bidi-theme-font:minor-bidi;}
</style>
<![endif]-->
<title>III: Small: In-memory, Distributed, and Adaptive Spatio-textual Query Processing</title>
<meta name=Title content="">
<meta name=Keywords content="">
<!--[if gte mso 9]><xml>
 <o:shapedefaults v:ext="edit" spidmax="1026"/>
</xml><![endif]--><!--[if gte mso 9]><xml>
 <o:shapelayout v:ext="edit">
  <o:idmap v:ext="edit" data="1"/>
 </o:shapelayout></xml><![endif]-->
</head>

<body lang=EN-US link=blue vlink="#954F72" style='tab-interval:.5in;word-wrap:
break-word'>

<div class=WordSection1>

<p class=MsoNormal style='mso-layout-grid-align:none;text-autospace:none'><span
style='font-size:17.0pt;font-family:"Times New Roman",serif'>III: Small:
In-memory, Distributed, and Adaptive <span class=SpellE>Spatio</span>-textual
Query Processing<o:p></o:p></span></p>

<p class=MsoNormal style='mso-layout-grid-align:none;text-autospace:none'><span
style='font-size:11.0pt;font-family:"Times New Roman",serif'><o:p>&nbsp;</o:p></span></p>

<p class=MsoNormal style='mso-layout-grid-align:none;text-autospace:none'><b><span
style='font-size:11.0pt;font-family:"Times New Roman",serif'>Contact
Information<o:p></o:p></span></b></p>

<p class=MsoNormal style='mso-layout-grid-align:none;text-autospace:none'><span
style='font-size:11.0pt;font-family:"Times New Roman",serif'>Walid G. Aref<o:p></o:p></span></p>

<p class=MsoNormal style='mso-layout-grid-align:none;text-autospace:none'><span
style='font-size:11.0pt;font-family:"Times New Roman",serif'>Department of
Computer Science<o:p></o:p></span></p>

<p class=MsoNormal style='mso-layout-grid-align:none;text-autospace:none'><span
style='font-size:11.0pt;font-family:"Times New Roman",serif'>Purdue University<o:p></o:p></span></p>

<p class=MsoNormal style='mso-layout-grid-align:none;text-autospace:none'><span
style='font-size:11.0pt;font-family:"Times New Roman",serif'>305 N. University
Street<o:p></o:p></span></p>

<p class=MsoNormal style='mso-layout-grid-align:none;text-autospace:none'><span
style='font-size:11.0pt;font-family:"Times New Roman",serif'>West Lafayette,
Indiana 47907<o:p></o:p></span></p>

<p class=MsoNormal style='mso-layout-grid-align:none;text-autospace:none'><span
style='font-size:11.0pt;font-family:"Times New Roman",serif'>Phone: (765)
494-1997 <o:p></o:p></span></p>

<p class=MsoNormal style='mso-layout-grid-align:none;text-autospace:none'><span
style='font-size:11.0pt;font-family:"Times New Roman",serif'>Fax: (765)
494-0739 <o:p></o:p></span></p>

<p class=MsoNormal style='mso-layout-grid-align:none;text-autospace:none'><span
style='font-size:11.0pt;font-family:"Times New Roman",serif'>Email:
aref@cs.purdue.edu <o:p></o:p></span></p>

<p class=MsoNormal style='mso-layout-grid-align:none;text-autospace:none'><span
style='font-size:11.0pt;font-family:"Times New Roman",serif'>URL:
http://www.cs.purdue.edu/faculty/aref.html<o:p></o:p></span></p>

<p class=MsoNormal style='mso-layout-grid-align:none;text-autospace:none'><span
style='font-size:11.0pt;font-family:"Times New Roman",serif'><span
style='mso-spacerun:yes'> </span><o:p></o:p></span></p>

<p class=MsoNormal style='mso-layout-grid-align:none;text-autospace:none'><b
style='mso-bidi-font-weight:normal'><i><span style='font-size:10.0pt'>This
material is based upon work supported by the National Science Foundation under
Grant No. III-1815796.</span></i></b><span style='font-size:11.0pt;font-family:
"Times New Roman",serif'><o:p></o:p></span></p>

<p class=MsoNormal style='mso-layout-grid-align:none;text-autospace:none'><b><span
style='font-size:11.0pt;font-family:"Times New Roman",serif'><o:p>&nbsp;</o:p></span></b></p>

<p class=MsoNormal style='mso-layout-grid-align:none;text-autospace:none'><b><span
style='font-size:11.0pt;font-family:"Times New Roman",serif'>Project Award
Information<o:p></o:p></span></b></p>

<p class=MsoNormal style='mso-layout-grid-align:none;text-autospace:none'><span
style='font-size:11.0pt;font-family:"Times New Roman",serif'>NSF Award Number:
III-1815796 <o:p></o:p></span></p>

<p class=MsoNormal style='mso-layout-grid-align:none;text-autospace:none'><span
style='font-size:11.0pt;font-family:"Times New Roman",serif'>Duration: 8/1/2018
-- 7/31/2022<o:p></o:p></span></p>

<p class=MsoNormal style='mso-layout-grid-align:none;text-autospace:none'><span
style='font-size:11.0pt;font-family:"Times New Roman",serif'>Title: In-memory,
Distributed, and Adaptive <span class=SpellE>Spatio</span>-textual Query
Processing<o:p></o:p></span></p>

<p class=MsoNormal style='mso-layout-grid-align:none;text-autospace:none'><span
style='font-size:11.0pt;font-family:"Times New Roman",serif'>PI: Walid G. Aref<o:p></o:p></span></p>

<p class=MsoNormal style='mso-layout-grid-align:none;text-autospace:none'><span
style='font-size:11.0pt;font-family:"Times New Roman",serif'>Project Web Page: <o:p></o:p></span></p>

<p class=MsoNormal style='mso-layout-grid-align:none;text-autospace:none'><span
style='font-size:11.0pt;font-family:"Times New Roman",serif'>http://www.cs.purdue.edu/homes/aref/IDAS<o:p></o:p></span></p>

<p class=MsoNormal style='mso-layout-grid-align:none;text-autospace:none'><span
style='font-size:11.0pt;font-family:"Times New Roman",serif'><o:p>&nbsp;</o:p></span></p>

<p class=MsoNormal style='mso-layout-grid-align:none;text-autospace:none'><b><span
style='font-size:11.0pt;font-family:"Times New Roman",serif'>Project Focus: <o:p></o:p></span></b></p>

<p class=MsoNormal style='mso-layout-grid-align:none;text-autospace:none'><span
style='font-size:11.0pt;font-family:"Times New Roman",serif'>The widespread use
of GPS-enabled smartphones along with the popularity of microblogging and
social networking, e.g., Twitter and Facebook, has resulted in producing large
amounts of text data. Typically, this text data, e.g., the tweets, is
geo-tagged by the location in which the text data has been produced. Many
applications make good use of this stream of geo-tagged text data (also termed
spatial-keyword or <span class=SpellE>spatio</span>-textual data), and provide
services to users based on the textual and the spatial components of the data.
Applications need to process a large number of user queries against <span
class=SpellE>spatio</span>-textual data. For example, in location-aware ad
targeting publish/subscribe systems, it is required to disseminate millions of
ads and promotions to millions of users based on the users' locations and
textual profiles. This project will address the hurdles that face these
applications and their underlying systems in order to function properly. <o:p></o:p></span></p>

<p class=MsoNormal style='mso-layout-grid-align:none;text-autospace:none'><span
style='font-size:11.0pt;font-family:"Times New Roman",serif'><o:p>&nbsp;</o:p></span></p>

<p class=MsoNormal style='mso-layout-grid-align:none;text-autospace:none'><span
style='font-size:11.0pt;font-family:"Times New Roman",serif'>More specifically,
this project will address the following research challenges that face <span
class=SpellE>spatio</span>-textual servers:<o:p></o:p></span></p>

<p class=MsoNormal style='mso-layout-grid-align:none;text-autospace:none'><b><span
style='font-size:11.0pt;font-family:"Times New Roman",serif'>(1)</span></b><span
style='font-size:11.0pt;font-family:"Times New Roman",serif'> <b>The
scalability challenge</b> to support large amounts of <span class=SpellE>spatio</span>-textual
data streams and queries in real time,<o:p></o:p></span></p>

<p class=MsoNormal style='mso-layout-grid-align:none;text-autospace:none'><b><span
style='font-size:11.0pt;font-family:"Times New Roman",serif'>(2)</span></b><span
style='font-size:11.0pt;font-family:"Times New Roman",serif'> <b>The
expressiveness challenge</b> that is exemplified by the lack of mechanisms that
adequately express complex <span class=SpellE>spatio</span>-textual queries. Querying
capabilities need to match the growing sophistication and complexity of the
continuously evolving location services, and <o:p></o:p></span></p>

<p class=MsoNormal style='mso-layout-grid-align:none;text-autospace:none'><b><span
style='font-size:11.0pt;font-family:"Times New Roman",serif'>(3) The adaptivity
challenge</span></b><span style='font-size:11.0pt;font-family:"Times New Roman",serif'>,
where systems need to adapt to changes in data distribution over time.<o:p></o:p></span></p>

<p class=MsoNormal style='mso-layout-grid-align:none;text-autospace:none'><span
style='font-size:11.0pt;font-family:"Times New Roman",serif'>In location
services, location-data distribution, users' interests, and hot keyword topics
change over time. A scalable <span class=SpellE>spatio</span>-textual server
needs to continuously adapt to these changes. The project will address these
scalability, expressiveness, and adaptivity challenges when processing large
numbers of queries on continuously streamed <span class=SpellE>spatio</span>-textual
data. The project will investigate how to support <span class=SpellE>spatio</span>-textual
data and queries as first-class citizens in an in-memory distributed data
system. Scalable architectures for handling large amounts of <span
class=SpellE>spatio</span>-textual data and continuous queries will be
investigated. In contrast to tailored solutions, relational-like <span
class=SpellE>spatio</span>-textual building-block operators will be developed
to express extended-SQL <span class=SpellE>spatio</span>-textual queries along
with costing, algebraic transformation rules, and query optimization
techniques. To address scalability and the variation in the workload, adaptive
and frequency-aware in-memory distributed indexing and query processing
techniques will be developed to dynamically organize and process the
continuously evolving <span class=SpellE>spatio</span>-textual data. The <span
class=SpellE>spatio</span>-textual indexing and query processing techniques to
be developed will dynamically account for the changes and differences in the
frequencies of keywords within the various spatial regions to automatically
choose the best <span class=SpellE>spatio</span>-textual data organization that
optimizes the system performance.<o:p></o:p></span></p>

<p class=MsoNormal style='mso-layout-grid-align:none;text-autospace:none'><span
style='font-size:11.0pt;font-family:"Times New Roman",serif'>For further
information see the project web page:<span style='mso-spacerun:yes'>  </span><a
href="https://www.cs.purdue.edu/homes/aref/IDAS">https://www.cs.purdue.edu/homes/aref/IDAS</a><o:p></o:p></span></p>

<p class=MsoNormal style='mso-layout-grid-align:none;text-autospace:none'><span
style='font-size:11.0pt;font-family:"Times New Roman",serif'><o:p>&nbsp;</o:p></span></p>

<p class=MsoNormal style='mso-layout-grid-align:none;text-autospace:none'><b><span
style='font-size:10.5pt;font-family:"Arial",sans-serif;mso-fareast-font-family:
"Times New Roman";color:black'><a href="#Y18">2018-2019 Project Activities</a><o:p></o:p></span></b></p>

<p class=MsoNormal style='mso-layout-grid-align:none;text-autospace:none'><b><span
style='font-size:10.5pt;font-family:"Arial",sans-serif;mso-fareast-font-family:
"Times New Roman";color:black'><a href="#Y19">2019-2020 Project Activities</a><o:p></o:p></span></b></p>

<p class=MsoNormal style='mso-layout-grid-align:none;text-autospace:none'><b><span
style='font-size:10.5pt;font-family:"Arial",sans-serif;mso-fareast-font-family:
"Times New Roman";color:black'><a href="#Y20">2020-2021 Project Activities</a><o:p></o:p></span></b></p>

<p class=MsoNormal style='mso-layout-grid-align:none;text-autospace:none'><b><span
style='font-size:10.5pt;font-family:"Arial",sans-serif;mso-fareast-font-family:
"Times New Roman";color:black'><a href="#Y21">2021-2022 Project Activities</a><o:p></o:p></span></b></p>

<p class=MsoNormal style='mso-layout-grid-align:none;text-autospace:none'><span
style='font-size:11.0pt;font-family:"Times New Roman",serif'><o:p>&nbsp;</o:p></span></p>

<p class=MsoNormal style='mso-layout-grid-align:none;text-autospace:none'><a
name=Y18><b><span style='font-size:10.5pt;font-family:"Arial",sans-serif;
mso-fareast-font-family:"Times New Roman";color:black'>2018-2019 Project
Activities</span></b></a><b><span style='font-size:10.5pt;font-family:"Arial",sans-serif;
mso-fareast-font-family:"Times New Roman";color:black'>:</span></b><b><span
style='font-size:11.0pt;font-family:"Times New Roman",serif'><o:p></o:p></span></b></p>

<p class=MsoNormal style='line-height:15.0pt;vertical-align:baseline'><span
style='font-size:10.5pt;font-family:"Arial",sans-serif;mso-fareast-font-family:
"Times New Roman";color:black'>During the 2018-2019 academic year, the first
year of this project, we started with two tutorial and survey activities. My
former Ph.D. student and I published a monograph on the subject of
scalable processing of spatial keyword queries. The monograph was published
by Morgan and Claypool Publishers in the series Synthesis Lectures on
Data Management. Also, we published a survey on spatial access methods that
appeared in the Springer <span class=SpellE>GeoInformatica</span> Journal early
in the year. We developed and prototyped new capabilities for adaptive query
processing in our spatial-keyword system, Tornado. This work was reported at
the ACM SIGSPATIAL Conference. We developed in-memory distributed spatial query
processing and optimization techniques in our <span class=SpellE>LocationSpark</span>
system. A detailed version of <span class=SpellE>LocationSpark</span> is
currently under review and is available on <span class=SpellE>arXiv</span>.
We developed the&nbsp;<span class=SpellE>ExplainER</span> prototype system to
understand and explain entity resolution classifiers with different granularity
levels of explanations.&nbsp;<span class=SpellE>ExplainER</span> was
demonstrated at the IEEE ICDE 2019 conference and received the best demo
award at the conference. We wrote&nbsp;a vision paper describing an
end-to-end human-centric data cleaning framework that was presented at the ACM
HILDA Workshop in July 2019.<o:p></o:p></span></p>

<p class=MsoNormal style='margin-top:7.5pt;margin-right:0in;margin-bottom:7.5pt;
margin-left:0in;line-height:15.0pt;vertical-align:baseline'><span
style='font-size:10.5pt;font-family:"Arial",sans-serif;mso-fareast-font-family:
"Times New Roman";color:black'>Over the Fall 2018 and Spring 2019 semesters,
Walid led a group of undergraduate students to conduct undergraduate research
in topics related to this project. Details about these research and education
activities will be given below.&nbsp;<o:p></o:p></span></p>

<p class=MsoNormal style='line-height:15.0pt;vertical-align:baseline'><span
style='font-size:10.5pt;font-family:"Arial",sans-serif;mso-fareast-font-family:
"Times New Roman";color:black'>This year, Walid gave a keynote speech titled:
“The Dos and Don’ts of <span class=SpellE>Location+X</span> Data Management: A
Systems Perspective<i><span style='border:none windowtext 1.0pt;mso-border-alt:
none windowtext 0in;padding:0in'>”&nbsp;</span></i>at the 20th IEEE
International Conference on Mobile Data Management in Hong Kong in June 2019.
Also, Walid is the 2019 co-chair for the program committee of the 16th
International Symposium on Spatial and Temporal Databases that will take place
in Vienna later this year.&nbsp;<o:p></o:p></span></p>

<p class=MsoNormal style='line-height:15.0pt;vertical-align:baseline'><span
style='font-size:10.5pt;font-family:"Arial",sans-serif;mso-fareast-font-family:
"Times New Roman";color:black'><o:p>&nbsp;</o:p></span></p>

<p class=MsoNormal style='line-height:15.0pt;vertical-align:baseline'><b><span
style='font-size:10.5pt;font-family:"Arial",sans-serif;mso-fareast-font-family:
"Times New Roman";color:black;border:none windowtext 1.0pt;mso-border-alt:none windowtext 0in;
padding:0in'><a
href="http://www.morganclaypoolpublishers.com/catalog_Orig/product_info.php?products_id=1358">Scalable
Processing of Spatial-Keyword Queries [Monograph 2019].</a>&nbsp;</span></b><span
style='font-size:10.5pt;font-family:"Arial",sans-serif;mso-fareast-font-family:
"Times New Roman";color:black'>Within the scope of this project, my former
student and I have developed an educational milestone. We
wrote a manuscript on scalable query processing techniques for spatial keyword
data. This 110+ page monograph was published by Morgan and Claypool in
their&nbsp;series Synthesis Lectures on Data Management. The monograph
addresses&nbsp;text data that is associated with location data and that has
become ubiquitous. A tweet is an example of this type of data, where the text
in a tweet is associated with the location where the tweet has been issued. We
use the term spatial-keyword data to refer to this type of data.
Spatial-keyword data is being generated at massive scale. Almost all online
transactions have an associated spatial trace. The spatial trace is derived
from GPS coordinates, IP addresses, or cell-phone-tower locations. Hundreds of
millions or even billions of spatial-keyword objects are being generated daily.
Spatial-keyword data has numerous applications that require efficient processing
and management of massive amounts of spatial-keyword data. The monograph starts
by overviewing some important applications of spatial-keyword data, and
demonstrates the scale at which spatial-keyword data is being generated. Then,
it formalizes and classifies the various types of queries that execute over
spatial-keyword data. Then, it discusses important and desirable properties of
spatial-keyword query languages that are needed to express queries over
spatial-keyword data. Existing spatial-keyword query languages vary in the
types of spatial-keyword queries that they can support. There are many systems
that process spatial-keyword queries. Systems differ from each other in various
aspects, e.g., whether the system is batch-oriented or stream-based, and whether
the system is centralized or distributed. Moreover, spatial-keyword systems
vary in the types of queries that they support. Finally, systems vary in the
types of indexing techniques that they adopt. The monograph overviews the main
spatial-keyword data-management systems (SK-DMS, for short), and classifies
them according to their features. Moreover, the monograph describes the main
approaches adopted when indexing spatial-keyword data in the centralized and
distributed settings. Several case-studies of SK-DMSs are presented along with
the applications and query types that these SK-DMSs are targeted for and the
indexing techniques they utilize for processing their queries. Optimizing the
performance and the query processing of SK-DMSs still has many research
challenges and open problems. The monograph concludes with a discussion about
several important and open research-problems in the domain of scalable
spatial-keyword processing.&nbsp;<o:p></o:p></span></p>

<p class=MsoNormal style='margin-left:.5in;line-height:15.0pt;vertical-align:
baseline'><span style='font-size:10.5pt;font-family:"Arial",sans-serif;
mso-fareast-font-family:"Times New Roman";color:black'><o:p>&nbsp;</o:p></span></p>

<p class=MsoNormal style='line-height:15.0pt;vertical-align:baseline'><b><span
style='font-size:10.5pt;font-family:"Arial",sans-serif;mso-fareast-font-family:
"Times New Roman";color:black;border:none windowtext 1.0pt;mso-border-alt:none windowtext 0in;
padding:0in'><a
href="https://www.cs.purdue.edu/homes/aref/IDAS/A-tornado-sigspatial-2018.pdf">Adaptive
Processing of Spatial-Keyword Data Over a Distributed Streaming Cluster
(SIGSPATIAL 2018).</a> </span></b><span style='font-size:10.5pt;font-family:
"Arial",sans-serif;mso-fareast-font-family:"Times New Roman";color:black'>The
widespread use of GPS-enabled smartphones along with the popularity of
micro-blogging and social networking applications, e.g., Twitter and Facebook,
has resulted in the generation of huge streams of geo-tagged textual data. Many
applications require real-time processing of these streams. For example,
location-based ad targeting systems enable advertisers to register millions of
ads to millions of users based on the users’ location and textual profile.
Existing streaming systems are either centralized or are not spatial-keyword
aware, and hence these systems cannot efficiently support the processing of
rapidly arriving spatial-keyword data streams. In this research, we introduce a
two-layered indexing scheme for the distributed processing of spatial-keyword
data streams. We realize this indexing scheme in Tornado, a distributed
spatial-keyword streaming system. The first layer, termed the routing layer, is
used to fairly distribute the workload, and furthermore, co-locate the data
objects and the corresponding queries at the same processing units. The routing
layer uses the Augmented-Grid, a novel structure that is equipped with an
efficient search algorithm for distributing the data objects and queries. The
second layer, termed the evaluation layer, resides within each processing unit
to reduce the processing overhead. The two-layered index adapts to changes in
the workload by applying a cost formula that continuously represents the
processing overhead at each processing unit. Extensive experimental evaluation
using real Twitter data indicates that Tornado achieves high scalability and
more than 2x improvement over the baseline approach in terms of the overall
system throughput.<o:p></o:p></span></p>

<p class=MsoNormal style='margin-left:.5in;line-height:15.0pt;vertical-align:
baseline'><span style='font-size:10.5pt;font-family:"Arial",sans-serif;
mso-fareast-font-family:"Times New Roman";color:black'><o:p>&nbsp;</o:p></span></p>

<p class=MsoNormal style='line-height:15.0pt;vertical-align:baseline'><b><span
style='font-size:10.5pt;font-family:"Arial",sans-serif;mso-fareast-font-family:
"Times New Roman";color:black;border:none windowtext 1.0pt;mso-border-alt:none windowtext 0in;
padding:0in'><a
href="https://www.cs.purdue.edu/homes/aref/IDAS/A-spatio-temporalaccess-methods-geo.pdf"><span
class=SpellE>Spatio</span>-Temporal Access Methods: A Survey (2010 - 2017) (<span
class=SpellE>GeoInformatica</span> 2019).</a>&nbsp;</span></b><span
style='font-size:10.5pt;font-family:"Arial",sans-serif;mso-fareast-font-family:
"Times New Roman";color:black'>The volume of <span class=SpellE>spatio</span>-temporal
data is growing at a rapid pace due to advances in location-aware devices,
e.g., smartphones, and the popularity of location-based services, e.g.,
navigation services. A number of <span class=SpellE>spatio</span>-temporal
access methods have been proposed to support efficient processing of queries
over the <span class=SpellE>spatio</span>-temporal data. <span class=SpellE>Spatio</span>-temporal
access methods can be classified according to the type of data being indexed
into the following categories: (1) indexes for historical <span class=SpellE>spatio</span>-temporal
data, (2) indexes for current and recent <span class=SpellE>spatio</span>-temporal
data, (3) indexes for future <span class=SpellE>spatio</span>-temporal data,
(4) indexes for past, present, and future <span class=SpellE>spatio</span>-temporal
data, (5) indexes for <span class=SpellE>spatio</span>-temporal data with
associated textual data, and (6) parallel and distributed <span class=SpellE>spatio</span>-temporal
systems and indexes. This survey is Part 3 of a series, following our two previous surveys on the
same subject that were both published in the IEEE Data Engineering Bulletin. In
this survey, we present an overview and a broad classification of the <span
class=SpellE>spatio</span>-temporal access methods published between 2010 and
2017. <o:p></o:p></span></p>

<p class=MsoNormal style='margin-left:.5in;line-height:15.0pt;vertical-align:
baseline'><span style='font-size:10.5pt;font-family:"Arial",sans-serif;
mso-fareast-font-family:"Times New Roman";color:black'><o:p>&nbsp;</o:p></span></p>

<p class=MsoNormal style='line-height:15.0pt;vertical-align:baseline'><b><span
style='font-size:10.5pt;font-family:"Arial",sans-serif;mso-fareast-font-family:
"Times New Roman";color:black;border:none windowtext 1.0pt;mso-border-alt:none windowtext 0in;
padding:0in'><a href="https://www.cs.purdue.edu/homes/aref/IDAS/A-ExplainER.pdf"><span
class=SpellE>ExplainER</span>: Entity Resolution Explanations&nbsp;(IEEE
ICDE&nbsp;2019 Demo).</a>&nbsp;</span></b><span style='font-size:10.5pt;
font-family:"Arial",sans-serif;mso-fareast-font-family:"Times New Roman";
color:black'>Entity Resolution is a fundamental data cleaning and integration
problem that has received considerable attention in the past few decades. While
rule-based methods have been used in many practical scenarios and are often
easy to understand, machine-learning-based methods provide the best accuracy.
However, the state-of-the-art classifiers are very opaque. There has been some
work towards understanding and debugging the early stages of the entity
resolution pipeline, e.g., blocking and generating features (similarity scores).
However, there are no such efforts for explaining the model or its predictions.
In this demo, we propose <span class=SpellE>ExplainER</span>, a tool to
understand and explain entity resolution classifiers with different granularity
levels of explanations. Using several benchmark datasets, we will demonstrate
how <span class=SpellE>ExplainER</span> can handle different scenarios for a
variety of classifiers. <o:p></o:p></span></p>

<p class=MsoNormal style='line-height:15.0pt;vertical-align:baseline'><span
style='font-size:10.5pt;font-family:"Arial",sans-serif;mso-fareast-font-family:
"Times New Roman";color:black'><o:p>&nbsp;</o:p></span></p>

<p class=MsoNormal style='line-height:15.0pt;vertical-align:baseline'><b><span
style='font-size:10.5pt;font-family:"Arial",sans-serif;mso-fareast-font-family:
"Times New Roman";color:black;border:none windowtext 1.0pt;mso-border-alt:none windowtext 0in;
padding:0in'><a href="https://www.cs.purdue.edu/homes/aref/IDAS/hilda2019.pdf">Towards
an End-to-End Human-Centric Data Cleaning Framework [HILDA 2019].</a>&nbsp;</span></b><span
style='font-size:10.5pt;font-family:"Arial",sans-serif;mso-fareast-font-family:
"Times New Roman";color:black'>Data Cleaning refers to the process of detecting
and fixing errors in the data. Human involvement is instrumental at several
stages of this process such as providing rules or validating computed repairs.
There is a plethora of data cleaning algorithms addressing a wide range of data
errors (e.g., detecting duplicates, violations of integrity constraints, and
missing values). Many of these algorithms involve a human in the loop; however,
the latter is usually coupled to the underlying cleaning algorithms. In a real
data cleaning pipeline, several data cleaning operations are performed using
different tools. A high-level reasoning on these tools, when combined to repair
the data, has the potential to unlock useful use cases to involve humans in the
cleaning process. Additionally, we believe there is an opportunity to benefit
from recent advances in active learning methods to minimize the effort humans
have to spend to verify data items produced by tools or humans. There is
currently no end-to-end data cleaning framework that systematically involves
humans in the cleaning pipeline regardless of the underlying cleaning
algorithms. In this research, we present opportunities that this framework
could offer, and highlight key challenges that need to be addressed to realize
this vision. We present a design vision and discuss scenarios that motivate the
need for this framework to judiciously assist humans in the cleaning
process.&nbsp;<o:p></o:p></span></p>

<p class=MsoNormal style='margin-top:.25in;margin-right:0in;margin-bottom:12.0pt;
margin-left:0in;mso-outline-level:3;vertical-align:baseline'><span
style='font-size:13.5pt;font-family:"Arial",sans-serif;mso-fareast-font-family:
"Times New Roman";color:#303B53'>Undergraduate Research Projects<o:p></o:p></span></p>

<p class=MsoNormal style='line-height:15.0pt;vertical-align:baseline'><span
style='font-size:10.5pt;font-family:"Arial",sans-serif;mso-fareast-font-family:
"Times New Roman";color:black'>Undergraduate students are gaining research and
development as well as systems-oriented experience in the context of this
project. One Ph.D. student is gaining training in conducting systems-oriented
research.&nbsp;<o:p></o:p></span></p>

<p class=MsoNormal style='margin-top:7.5pt;margin-right:0in;margin-bottom:7.5pt;
margin-left:0in;line-height:15.0pt;vertical-align:baseline'><span
style='font-size:10.5pt;font-family:"Arial",sans-serif;mso-fareast-font-family:
"Times New Roman";color:black'>In the context of this project, Walid has
offered research opportunities during the Fall 2018 and Spring 2019 semesters for the
following eight undergraduate students:<o:p></o:p></span></p>

<p class=MsoNormal style='margin-top:7.5pt;margin-right:0in;margin-bottom:7.5pt;
margin-left:0in;line-height:15.0pt;vertical-align:baseline'><span
style='font-size:10.5pt;font-family:"Arial",sans-serif;mso-fareast-font-family:
"Times New Roman";color:black'>Daniel Hu, Daksh <span class=SpellE>Jotwani</span>,
Piyush <span class=SpellE>Juneja</span> (two semesters), Aaron <span
class=SpellE>Nuestedter</span> (two semesters), Harsh Patel, Peyton Puckett,
Logesh <span class=SpellE>Ramadoss</span>, and <span class=SpellE>Ruoyu</span>
Song.<o:p></o:p></span></p>

<p class=MsoNormal style='margin-top:7.5pt;margin-right:0in;margin-bottom:7.5pt;
margin-left:0in;line-height:15.0pt;vertical-align:baseline'><span
style='font-size:10.5pt;font-family:"Arial",sans-serif;mso-fareast-font-family:
"Times New Roman";color:black'>The students worked in four groups:&nbsp;<o:p></o:p></span></p>

<p class=MsoNormal style='margin-top:7.5pt;margin-right:0in;margin-bottom:7.5pt;
margin-left:0in;line-height:15.0pt;vertical-align:baseline'><span
style='font-size:10.5pt;font-family:"Arial",sans-serif;mso-fareast-font-family:
"Times New Roman";color:black'>-&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;Group 1:
Daniel Hu and Peyton Puckett worked on the Tornado distributed in-memory
spatial keyword system along with a Ph.D. student from Walid’s group to develop
a running prototype of a demo system for Tornado. This involved introducing
Kafka between the front-end interfacing client of the system and the back-end
Apache Storm distributed streaming engine.<o:p></o:p></span></p>

<p class=MsoNormal style='margin-top:7.5pt;margin-right:0in;margin-bottom:7.5pt;
margin-left:0in;line-height:15.0pt;vertical-align:baseline'><span
style='font-size:10.5pt;font-family:"Arial",sans-serif;mso-fareast-font-family:
"Times New Roman";color:black'>-&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;Group 2:
Piyush <span class=SpellE>Juneja</span>, Aaron <span class=SpellE>Nuestedter</span>,
and Harsh Patel worked on the LIMO system along with a Ph.D. student from
Walid’s group to develop various aspects of LIMO. They introduced testing
capabilities and enforced coding conventions for Tornado, added publicly
available elevation data to the maps in the LIMO system, and developed video
documentation on how to use the LIMO system. Piyush later worked on developing
a generalized spatial-keyword index inside of PostgreSQL.<o:p></o:p></span></p>

<p class=MsoNormal style='margin-top:7.5pt;margin-right:0in;margin-bottom:7.5pt;
margin-left:0in;line-height:15.0pt;vertical-align:baseline'><span
style='font-size:10.5pt;font-family:"Arial",sans-serif;mso-fareast-font-family:
"Times New Roman";color:black'>-&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;Group 3: <span
class=SpellE>Ruoyu</span> Song worked with two graduate students from Walid’s
group, A. Mamun and M. Hassan to add new graph functions into the <span
class=SpellE>GRFusion</span> system.<o:p></o:p></span></p>

<p class=MsoNormal style='margin-top:7.5pt;margin-right:0in;margin-bottom:7.5pt;
margin-left:0in;line-height:15.0pt;vertical-align:baseline'><span
style='font-size:10.5pt;font-family:"Arial",sans-serif;mso-fareast-font-family:
"Times New Roman";color:black'>-&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;Group 4:
Daksh <span class=SpellE>Jotwani</span> (in Fall 2018) and Logesh <span
class=SpellE>Ramadoss</span> (in Spring 2019) worked with one Ph.D. student from
Walid’s group to realize an ML-based Spatial Index.<o:p></o:p></span></p>

<p class=MsoNormal style='margin-top:7.5pt;margin-right:0in;margin-bottom:7.5pt;
margin-left:0in;line-height:15.0pt;vertical-align:baseline'><span
style='font-size:10.5pt;font-family:"Arial",sans-serif;mso-fareast-font-family:
"Times New Roman";color:black'>To ensure continuity, a graduate student, funded
under this project, followed up, along with Walid, on the work of each of the four
groups on a weekly basis, and has been continuing this research in the hope of
finishing and publishing this work.&nbsp;<o:p></o:p></span></p>

<p class=MsoNormal style='margin-top:7.5pt;margin-right:0in;margin-bottom:7.5pt;
margin-left:0in;line-height:15.0pt;vertical-align:baseline'><span
style='font-size:10.5pt;font-family:"Arial",sans-serif;mso-fareast-font-family:
"Times New Roman";color:black'>The students maintained all their
project-related activities on GitHub under <span class=SpellE>PurdueDB</span>,
where they gained excellent experience working on relatively large
systems-oriented code bases.<o:p></o:p></span></p>

<p class=MsoNormal style='margin-top:7.5pt;margin-right:0in;margin-bottom:7.5pt;
margin-left:0in;line-height:15.0pt;vertical-align:baseline'><span
style='font-size:10.5pt;font-family:"Arial",sans-serif;mso-fareast-font-family:
"Times New Roman";color:black'>In Fall 2018, Walid offered a graduate-level
seminar course on various project-related topics, where five students got
training on presenting and discussing research papers and in conducting a
semester-long project.<o:p></o:p></span></p>

<p class=MsoNormal style='mso-layout-grid-align:none;text-autospace:none'><span
style='font-size:10.5pt;font-family:"Arial",sans-serif;mso-fareast-font-family:
"Times New Roman";color:black'><o:p>&nbsp;</o:p></span></p>

<p class=MsoNormal style='mso-layout-grid-align:none;text-autospace:none'><a
name=Y19><b><span style='font-size:13.5pt;font-family:"Arial",sans-serif;
mso-fareast-font-family:"Times New Roman";color:black'>2019-2020 Project
Activities:</span></b></a><span style='mso-bookmark:Y19'><b><span
style='font-size:13.5pt;font-family:"Times New Roman",serif'><o:p></o:p></span></b></span></p>

<span style='mso-bookmark:Y19'></span>

<p class=MsoNormal style='mso-margin-top-alt:auto;mso-margin-bottom-alt:auto;
background:white'><span style='font-size:10.5pt;font-family:"Times New Roman",serif;
mso-ascii-theme-font:minor-bidi;mso-hansi-theme-font:minor-bidi;mso-bidi-theme-font:
minor-bidi;color:black'>In 2019-2020, we have studied several aspects of
in-memory, distributed, and adaptive&nbsp;<span class=SpellE>spatio</span>-textual
query processing systems. These include <span class=SpellE>spatio</span>-textual
data analytics [SIGMOD 2020 Demo], on-line data partitioning [SIGMOD 2020 full
paper], ML-based on-line data partitioning using Reinforcement Learning [<span
class=SpellE>aiDM</span> 2020], a distributed system for <span class=SpellE>spatio</span>-textual
stream processing [PVLDB 2020], shared execution data analytics to address
scalability [SSDBM 2020], Grid/tree augmentation data structures for efficient
spatial query processing [ACM SIGSPATIAL 2019], and trend discovery in
micro-blogs over various space and time resolutions [<span class=SpellE>GeoInformatica</span>
2019]. Walid participated in a <span class=SpellE>Dagstuhl</span> Seminar in
December 2020.<o:p></o:p></span></p>

<p class=MsoNormal style='mso-margin-top-alt:auto;mso-margin-bottom-alt:auto;
background:white'><span style='font-size:10.5pt;font-family:"Times New Roman",serif;
mso-ascii-theme-font:minor-bidi;mso-hansi-theme-font:minor-bidi;mso-bidi-theme-font:
minor-bidi;color:black'>Over the Fall 2019 and Spring 2020 semesters, Walid led
a group of undergraduate students to conduct undergraduate research on topics
related to this project. Walid graduated one Ph.D. student on the topic of
“Attack-Resilient Adaptive Load-Balancing in Distributed Spatial Data Streaming
Systems”, and trained six other Ph.D. students in project-related research.<o:p></o:p></span></p>

<p class=MsoNormal style='mso-margin-top-alt:auto;mso-margin-bottom-alt:auto;
background:white'><span style='font-size:10.5pt;font-family:"Times New Roman",serif;
mso-ascii-theme-font:minor-bidi;mso-hansi-theme-font:minor-bidi;mso-bidi-theme-font:
minor-bidi;color:black'>Details about these research and education activities
will be given below.&nbsp;<o:p></o:p></span></p>

<p class=MsoNormal style='mso-margin-top-alt:auto;mso-margin-bottom-alt:auto;
background:white'><b><span style='font-size:10.5pt;font-family:"Times New Roman",serif;
mso-ascii-theme-font:minor-bidi;mso-hansi-theme-font:minor-bidi;mso-bidi-theme-font:
minor-bidi;color:black'><a
href="https://www.cs.purdue.edu/homes/aref/IDAS/sigspatial2019.pdf">An
Investigation of Grid-enabled Tree Indexes for Spatial Query Processing. [ACM
SIGSPATIAL 2019]</a> </span></b><span style='font-size:10.5pt;font-family:"Times New Roman",serif;
mso-ascii-theme-font:minor-bidi;mso-hansi-theme-font:minor-bidi;mso-bidi-theme-font:
minor-bidi;color:black'>Two-dimensional tree-based spatial indexes (e.g., the
quadtree or the k-d tree) are commonly used for indexing spatial data. However,
both types of spatial indexes have limitations. Although two-dimensional trees
can handle skewed data, index traversal and tree maintenance can be expensive.
In contrast, spatial grids have low update overhead, but are not suitable for
skewed data. In this research, we investigate the augmentation of a grid into
tree-based indexing for spatial query processing. For this purpose, we
introduce the Grid-Enabled Tree index (GE-Tree, for short), a hybrid spatial
tree structure that augments a spatial grid to two-dimensional tree indexes. In
particular, we investigate the use of a grid at the leaf level of a
two-dimensional tree to facilitate tree navigation and maintenance.&nbsp;<o:p></o:p></span></p>

<p class=MsoNormal style='mso-margin-top-alt:auto;mso-margin-bottom-alt:auto;
background:white'><b><span style='font-size:10.5pt;font-family:"Times New Roman",serif;
mso-ascii-theme-font:minor-bidi;mso-hansi-theme-font:minor-bidi;mso-bidi-theme-font:
minor-bidi;color:black'><a
href="https://www.cs.purdue.edu/homes/aref/IDAS/sigmod-demo2020-pdfa.pdf">STAR:
A Distributed Stream Warehouse System for Spatial Data. [SIGMOD 2020 Demo]</a>&nbsp;</span></b><span
style='font-size:10.5pt;font-family:"Times New Roman",serif;mso-ascii-theme-font:
minor-bidi;mso-hansi-theme-font:minor-bidi;mso-bidi-theme-font:minor-bidi;
color:black'>Mobile and location-based services produce massive streams of
spatial and textual data. In order to enable spatial and textual data
analytics, spatial and textual data need to be streamed into a data stream
warehouse system that can provide real-time analytics over the incoming spatial
and textual data in the warehouse. A spatial data stream warehouse system
(DSWS) should be able to efficiently ingest the incoming data, and enable
online analytical processing (OLAP) over the streamed data. Existing DSWSs are
not tailored for spatial data. In this research, we introduce STAR, a spatial
data stream warehouse system. STAR is a distributed in-memory data stream
warehouse system that provides low-latency and up-to-date analytical results
over a fast-arriving spatial data stream. STAR supports both snapshot and
continuous queries that are composed of algebraic or holistic aggregate
functions and ad hoc query constraints over spatial, textual, and temporal data
attributes. STAR implements an effective view materialization algorithm, and
adopts a memory-efficient framework that facilitates the processing of streamed
data and the maintenance of materialized views.&nbsp;<o:p></o:p></span></p>

<p class=MsoNormal style='mso-margin-top-alt:auto;mso-margin-bottom-alt:auto;
background:white'><b><span style='font-size:10.5pt;font-family:"Times New Roman",serif;
mso-ascii-theme-font:minor-bidi;mso-hansi-theme-font:minor-bidi;mso-bidi-theme-font:
minor-bidi;color:black'><a
href="https://www.cs.purdue.edu/homes/aref/IDAS/sigmod2020-pdfa.pdf">Prompt: Dynamic
Data-Partitioning for Distributed Micro-batch Stream Processing Systems.<span
style='font-weight:normal'>&nbsp;[</span>SIGMOD 2020<span style='font-weight:
normal'>]</span></a></span></b><span style='font-size:10.5pt;font-family:"Times New Roman",serif;
mso-ascii-theme-font:minor-bidi;mso-hansi-theme-font:minor-bidi;mso-bidi-theme-font:
minor-bidi;color:black'> Advances in real-world applications require
high-throughput processing over large data streams. Micro-batching has been
proposed to support the needs of these applications. In micro-batching, the
processing and batching of the data are interleaved, where the incoming data
tuples are first buffered as data blocks, and then are processed collectively
using parallel function constructs (e.g.,
Map-Reduce). The size of a micro-batch is set to guarantee a certain
response-time latency that is to conform to the application’s service-level
agreement. In contrast to tuple-at-a-time data stream processing,
micro-batching has the potential to sustain higher data rates. However,
existing micro-batch stream processing systems use basic data-partitioning
techniques that do not account for data skew and variable data rates.
Load-awareness is necessary to maintain performance and to enhance resource
utilization. A new data partitioning scheme, termed Prompt, is presented that
leverages the characteristics of the micro-batch processing model. In the
batching phase, a frequency-aware buffering mechanism is introduced that
progressively maintains run-time statistics, and provides on-line key-based
sorting as data tuples arrive. Because achieving optimal data partitioning is NP-Hard
in this context, a workload-aware greedy algorithm is introduced that
partitions the buffered data tuples efficiently for the Map stage. In the
processing phase, a load-aware distribution mechanism is presented that
balances the size of the input to the Reduce stage without incurring inter-task
communication overhead. Moreover, Prompt elastically adapts resource
consumption according to workload changes.&nbsp;<o:p></o:p></span></p>

<p class=MsoNormal style='mso-margin-top-alt:auto;mso-margin-bottom-alt:auto;
background:white'><b><span style='font-size:10.5pt;font-family:"Times New Roman",serif;
mso-ascii-theme-font:minor-bidi;mso-hansi-theme-font:minor-bidi;mso-bidi-theme-font:
minor-bidi;color:black'><a
href="https://www.cs.purdue.edu/homes/aref/IDAS/aidm2020.pdf"><span
class=SpellE>PartLy</span>: Learning Data Partitioning for Distributed Data
Stream Processing [<span class=SpellE>aiDM</span> 2020]</a>&nbsp;</span></b><span
style='font-size:10.5pt;font-family:"Times New Roman",serif;mso-ascii-theme-font:
minor-bidi;mso-hansi-theme-font:minor-bidi;mso-bidi-theme-font:minor-bidi;
color:black'>In this research, we expand on our well-optimized Prompt online
data partitioning mechanism by using reinforcement learning to learn proper
data partitioning in a micro-batched data streaming setup. We realize that data
partitioning plays a critical role in data stream processing. Current data
partitioning techniques use simple, static heuristics that do not incorporate
feedback about the quality of the partitioning decision (i.e., fire and forget
strategy). Hence, the data partitioner often repeatedly chooses the same
decision. In this paper, we argue that reinforcement learning techniques can be
applied to address this problem. The use of artificial neural networks can
facilitate learning of efficient partitioning policies. We identify the
challenges that emerge when applying machine learning techniques to the data
partitioning problem for distributed data stream processing. Furthermore, we
introduce <span class=SpellE>PartLy</span>, a proof-of-concept data
partitioner, and present preliminary results that indicate <span class=SpellE>PartLy’s</span>
potential to match the performance of state-of-the-art techniques in terms of
partitioning quality, while minimizing storage and processing overheads.&nbsp;<o:p></o:p></span></p>

<p class=MsoNormal style='mso-margin-top-alt:auto;mso-margin-bottom-alt:auto;
background:white'><b><span style='font-size:10.5pt;font-family:"Times New Roman",serif;
mso-ascii-theme-font:minor-bidi;mso-hansi-theme-font:minor-bidi;mso-bidi-theme-font:
minor-bidi;color:black'><a
href="https://www.cs.purdue.edu/homes/aref/IDAS/vldb2020-pdfa.pdf">SSTD: A
Distributed System on Streaming <span class=SpellE>Spatio</span>-Textual Data
[PVLDB 2020]</a>.&nbsp;</span></b><span style='font-size:10.5pt;font-family:
"Times New Roman",serif;mso-ascii-theme-font:minor-bidi;mso-hansi-theme-font:
minor-bidi;mso-bidi-theme-font:minor-bidi;color:black'>Streaming <span
class=SpellE>spatio</span>-textual data that contains geolocations and textual
contents, e.g., geo-tagged tweets, is becoming increasingly available. Users
can register continuous queries to receive up-to-date results continuously, or
pose snapshot queries to receive results instantly. The large scale of <span
class=SpellE>spatio</span>-textual data streams and huge amounts of queries
pose great challenges to the current location-based services, and call for more
efficient data management systems. In this research, we realize SSTD (Streaming <span
class=SpellE>Spatio</span>-Textual Data), a distributed in-memory system
supporting both continuous and snapshot queries with spatial, textual, and
temporal constraints over data streams. Compared with existing distributed data
stream management systems, SSTD has three novel aspects: (1) It supports many
types of queries over <span class=GramE>streamed <span class=SpellE>spatio</span></span>-textual
data; (2) SSTD adopts a new workload partitioning method, termed QT (Quad-Text)
tree, that utilizes the joint distribution of queries and <span class=SpellE>spatio</span>-textual
data to reduce query latency and enhance system throughput; (3) To achieve load
balance and robustness, we develop three new workload adjustment methods for
SSTD to fit the changes in the distributions of data or queries. Extensive
experiments on real-life datasets demonstrate the superior performance of SSTD.<o:p></o:p></span></p>

<p class=MsoNormal style='mso-margin-top-alt:auto;mso-margin-bottom-alt:auto;
background:white'><b><span style='font-size:10.5pt;font-family:"Times New Roman",serif;
mso-ascii-theme-font:minor-bidi;mso-hansi-theme-font:minor-bidi;mso-bidi-theme-font:
minor-bidi;color:black'><a
href="https://www.cs.purdue.edu/homes/aref/IDAS/geoinformatica2020.pdf">Local
Trend Discovery on Real-time Microblogs with Uncertain Locations in Tight
Memory Environments. [<span class=SpellE>GeoInformatica</span> 2019]</a>&nbsp;</span></b><span
style='font-size:10.5pt;font-family:"Times New Roman",serif;mso-ascii-theme-font:
minor-bidi;mso-hansi-theme-font:minor-bidi;mso-bidi-theme-font:minor-bidi;
color:black'>In this research, we developed <span class=SpellE>GeoTrend</span>+,
a system approach to support scalable local trend discovery on recent
microblogs, e.g., tweets, comments, online reviews, and check-ins, that come in
real time. <span class=SpellE>GeoTrend</span>+ discovers top-k trending
keywords in arbitrary spatial regions from recent microblogs that continuously
arrive at high rates, a significant portion of which have uncertain geolocations. <span
class=SpellE>GeoTrend</span>+ distinguishes itself from existing techniques in
different aspects: (1) Discovering trends in arbitrary spatial regions, e.g.,
city blocks. (2) Considering both exact geolocations, e.g., accurate
latitude/longitude coordinates, and uncertain geolocations, e.g.,
district-level or city-level, that represent a significant portion of past
years’ microblogs. (3) Promoting recent microblogs as first-class citizens and
optimizing different components to digest a continuous flow of fast data in
main-memory while removing old data efficiently. (4) Providing various
main-memory optimization techniques that are able to distinguish useful from
useless data to effectively utilize tight memory resources while maintaining
accurate query results on relatively large amounts of data. (5) Supporting
various trending measures that effectively capture trending items under a
variety of definitions that suit different applications. <span class=SpellE>GeoTrend</span>+
limits its scope to real-time data that is posted during the last T time units.
To support its queries efficiently, <span class=SpellE>GeoTrend</span>+ employs
an in-memory spatial index that is able to efficiently digest incoming data and
expire data that is beyond the last T time units. The index also materializes
top-k keywords in different spatial regions so that incoming queries can be
processed with low latency. In peak times, the main-memory optimization
techniques are employed to shed less important data to sustain high query
accuracy with limited memory resources. Experimental results based on real data
and queries show the scalability of <span class=SpellE>GeoTrend</span>+ to
support high arrival rates and low query response time, and at least 90% query
accuracy even under limited memory resources.<o:p></o:p></span></p>

<p class=MsoNormal style='mso-margin-top-alt:auto;mso-margin-bottom-alt:auto;
background:white'><b><span style='font-size:10.5pt;font-family:"Times New Roman",serif;
mso-ascii-theme-font:minor-bidi;mso-hansi-theme-font:minor-bidi;mso-bidi-theme-font:
minor-bidi;color:black'><a
href="https://www.cs.purdue.edu/homes/aref/IDAS/ssdbm2020-pdfa.pdf">Shared Execution
Techniques for Business Data Analytics over Big Data Streams. [SSDBM 2020]</a>&nbsp;</span></b><span
style='font-size:10.5pt;font-family:"Times New Roman",serif;mso-ascii-theme-font:
minor-bidi;mso-hansi-theme-font:minor-bidi;mso-bidi-theme-font:minor-bidi;
color:black'>Data analytics requires processing large numbers of data streams
and creating materialized views in order to provide near real-time answers to
user queries. Materializing the view of each query and refreshing it
continuously as a separate query execution plan is not efficient and is not
scalable. In this research, we present a global query execution plan to
simultaneously support multiple queries, and minimize the number of input
scans, operators, and tuples flowing between the operators. We propose shared-execution
techniques for creating and maintaining materialized views in support of
business data analytics queries as an example. We utilize commonalities in
multiple business data analytics queries to support scalable and efficient
processing of big data streams. We analyze the cost and elasticity of various
shared-execution query-processing techniques in a distributed environment. The
paper highlights shared execution techniques for select predicates, group, and
aggregate calculations. We present how global query execution plans are run in
a distributed stream processing system that is built on top of a cluster-based
data streaming engine.&nbsp;<o:p></o:p></span></p>

<p class=MsoNormal style='mso-margin-top-alt:auto;mso-margin-bottom-alt:auto;
background:white'><strong><span style='font-size:10.5pt;font-family:"Arial",sans-serif;
color:black;border:none windowtext 1.0pt;mso-border-alt:none windowtext 0in;
padding:0in'>Training and Professional Development</span></strong><strong><span
style='font-family:"Arial",sans-serif;border:none windowtext 1.0pt;mso-border-alt:
none windowtext 0in;padding:0in'><o:p></o:p></span></strong></p>

<p class=MsoNormal style='mso-margin-top-alt:auto;mso-margin-bottom-alt:auto;
background:white'><strong><span style='font-size:10.5pt;font-family:"Arial",sans-serif;
color:black;border:none windowtext 1.0pt;mso-border-alt:none windowtext 0in;
padding:0in;font-weight:normal'>1. Undergraduate Research Opportunities<o:p></o:p></span></strong></p>

<p class=MsoNormal><span style='font-family:"Times New Roman",serif;mso-fareast-font-family:
"Times New Roman"'>In the context of this project, Walid has offered research
opportunities during the Fall 2019 and Spring 2020 semesters for the following five
undergraduate students (two female and three male students):<o:p></o:p></span></p>

<p class=MsoNormal><span style='font-family:"Times New Roman",serif;mso-fareast-font-family:
"Times New Roman"'><o:p>&nbsp;</o:p></span></p>

<p class=MsoNormal><span style='font-family:"Times New Roman",serif;mso-fareast-font-family:
"Times New Roman"'>Piyush <span class=SpellE>Juneja</span> (Graph Partitioning
Algorithms), <span class=SpellE>Nameer</span> A. Qureshi (Big Spatial Data
Systems), <span class=SpellE>Dhanushikka</span> <span class=SpellE>Ravichandiran</span>
(Database Concurrency Control Algorithms), Hao Wu (ML-based Learned Data
Indexing), <span class=SpellE>Shotobhisha</span> Sinha Ray (Big Data Systems).<o:p></o:p></span></p>

<p class=MsoNormal><span style='font-family:"Times New Roman",serif;mso-fareast-font-family:
"Times New Roman"'><o:p>&nbsp;</o:p></span></p>

<p class=MsoNormal><span style='font-family:"Times New Roman",serif;mso-fareast-font-family:
"Times New Roman"'>The students worked in four groups: <o:p></o:p></span></p>

<p class=MsoNormal><span style='font-family:"Times New Roman",serif;mso-fareast-font-family:
"Times New Roman"'><o:p>&nbsp;</o:p></span></p>

<p class=MsoNormal><span style='font-family:"Times New Roman",serif;mso-fareast-font-family:
"Times New Roman"'>- Group 1: Piyush <span class=SpellE>Juneja</span> worked on
surveying graph partitioning algorithms.<o:p></o:p></span></p>

<p class=MsoNormal><span style='font-family:"Times New Roman",serif;mso-fareast-font-family:
"Times New Roman"'><o:p>&nbsp;</o:p></span></p>

<p class=MsoNormal><span style='font-family:"Times New Roman",serif;mso-fareast-font-family:
"Times New Roman"'>- Group 2: <span class=SpellE>Nameer</span> Qureshi
developed a web site for all <span class=SpellE>spatio</span>-temporal access
methods and their corresponding published papers. <o:p></o:p></span></p>

<p class=MsoNormal><span style='font-family:"Times New Roman",serif;mso-fareast-font-family:
"Times New Roman"'><o:p>&nbsp;</o:p></span></p>

<p class=MsoNormal><span style='font-family:"Times New Roman",serif;mso-fareast-font-family:
"Times New Roman"'>- Group 3: <span class=SpellE>Shotobhisha</span> Sinha Ray
and <span class=SpellE>Dhanushikka</span> <span class=SpellE>Ravichandiran</span>
studied and surveyed various Database Concurrency Control Algorithms.<o:p></o:p></span></p>

<p class=MsoNormal><span style='font-family:"Times New Roman",serif;mso-fareast-font-family:
"Times New Roman"'><o:p>&nbsp;</o:p></span></p>

<p class=MsoNormal><span style='font-family:"Times New Roman",serif;mso-fareast-font-family:
"Times New Roman"'>- Group 4: Hao Wu surveyed the topic of learned indexes with a
focus on the multi-dimensional case.<o:p></o:p></span></p>

<p class=MsoNormal><span style='font-family:"Times New Roman",serif;mso-fareast-font-family:
"Times New Roman"'><o:p>&nbsp;</o:p></span></p>

<p class=MsoNormal><span style='font-family:"Times New Roman",serif;mso-fareast-font-family:
"Times New Roman"'>To ensure continuity, graduate students from Walid’s group,
along with Walid, followed up on the work of each of the four groups on a weekly
basis (one graduate student per group), and have been continuing this research
in the hope of finishing and publishing this work. <o:p></o:p></span></p>

<p class=MsoNormal><span style='font-family:"Times New Roman",serif;mso-fareast-font-family:
"Times New Roman"'><o:p>&nbsp;</o:p></span></p>

<p class=MsoNormal><span style='font-family:"Times New Roman",serif;mso-fareast-font-family:
"Times New Roman"'>Of note is the survey on multi-dimensional learned
indexes, which has been accepted as a tutorial in the ACM SIGSPATIAL 2020
Conference. Both Hao Wu (Undergraduate) and Abdullah Al Mamun (Ph.D. student)
will be presenting this tutorial along with Walid at the conference.<o:p></o:p></span></p>

<p class=MsoNormal><span style='font-family:"Times New Roman",serif;mso-fareast-font-family:
"Times New Roman"'><o:p>&nbsp;</o:p></span></p>

<p class=MsoNormal><span style='font-family:"Times New Roman",serif;mso-fareast-font-family:
"Times New Roman"'>Graduate Research Opportunities:<o:p></o:p></span></p>

<p class=MsoNormal><span style='font-family:"Times New Roman",serif;mso-fareast-font-family:
"Times New Roman"'><o:p>&nbsp;</o:p></span></p>

<p class=MsoNormal><span style='font-family:"Times New Roman",serif;mso-fareast-font-family:
"Times New Roman"'>For graduate students, in Fall 2019 and Spring 2020, Walid
has offered several research training opportunities as graduate-level PhD
research and independent study courses that involve various project-related
topics, where several students received training in presenting and discussing
research papers and in conducting a semester-long project. These students
include:<o:p></o:p></span></p>

<p class=MsoListParagraphCxSpFirst style='text-indent:-.25in;mso-list:l1 level1 lfo2'><![if !supportLists]><span
style='font-family:Symbol;mso-fareast-font-family:Symbol;mso-bidi-font-family:
Symbol'><span style='mso-list:Ignore'>·<span style='font:7.0pt "Times New Roman"'>&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;
</span></span></span><![endif]><span dir=LTR></span><span style='font-family:
"Times New Roman",serif;mso-fareast-font-family:"Times New Roman"'>Amira <span
class=SpellE>Mamoun</span> (Dataset Discovery Techniques)<o:p></o:p></span></p>

<p class=MsoListParagraphCxSpMiddle style='text-indent:-.25in;mso-list:l1 level1 lfo2'><![if !supportLists]><span
style='font-family:Symbol;mso-fareast-font-family:Symbol;mso-bidi-font-family:
Symbol'><span style='mso-list:Ignore'>·<span style='font:7.0pt "Times New Roman"'>&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;
</span></span></span><![endif]><span dir=LTR></span><span class=SpellE><span
style='font-family:"Times New Roman",serif;mso-fareast-font-family:"Times New Roman"'>Jaewoo</span></span><span
style='font-family:"Times New Roman",serif;mso-fareast-font-family:"Times New Roman"'>
Shin (Update-tolerant LSM-based Spatial Indexing)<o:p></o:p></span></p>

<p class=MsoListParagraphCxSpMiddle style='text-indent:-.25in;mso-list:l1 level1 lfo2'><![if !supportLists]><span
style='font-family:Symbol;mso-fareast-font-family:Symbol;mso-bidi-font-family:
Symbol'><span style='mso-list:Ignore'>·<span style='font:7.0pt "Times New Roman"'>&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;
</span></span></span><![endif]><span dir=LTR></span><span style='font-family:
"Times New Roman",serif;mso-fareast-font-family:"Times New Roman"'>Abdullah Al
Mamun (Learned Spatial Indexing)<o:p></o:p></span></p>

<p class=MsoListParagraphCxSpMiddle style='text-indent:-.25in;mso-list:l1 level1 lfo2'><![if !supportLists]><span
style='font-family:Symbol;mso-fareast-font-family:Symbol;mso-bidi-font-family:
Symbol'><span style='mso-list:Ignore'>·<span style='font:7.0pt "Times New Roman"'>&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;
</span></span></span><![endif]><span dir=LTR></span><span style='font-family:
"Times New Roman",serif;mso-fareast-font-family:"Times New Roman"'>Ahmed
Abdelhamid (Intelligent Data Partitioning in Micro-batched Big Data Streaming
Systems)<o:p></o:p></span></p>

<p class=MsoListParagraphCxSpMiddle style='text-indent:-.25in;mso-list:l1 level1 lfo2'><![if !supportLists]><span
style='font-family:Symbol;mso-fareast-font-family:Symbol;mso-bidi-font-family:
Symbol'><span style='mso-list:Ignore'>·<span style='font:7.0pt "Times New Roman"'>&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;
</span></span></span><![endif]><span dir=LTR></span><span style='font-family:
"Times New Roman",serif;mso-fareast-font-family:"Times New Roman"'>Lu Xing (Concurrency
Control and Query Optimization in Graph Data Management Systems)<o:p></o:p></span></p>

<p class=MsoListParagraphCxSpMiddle style='text-indent:-.25in;mso-list:l1 level1 lfo2'><![if !supportLists]><span
style='font-family:Symbol;mso-fareast-font-family:Symbol;mso-bidi-font-family:
Symbol'><span style='mso-list:Ignore'>·<span style='font:7.0pt "Times New Roman"'>&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;
</span></span></span><![endif]><span dir=LTR></span><span class=SpellE><span
style='font-family:"Times New Roman",serif;mso-fareast-font-family:"Times New Roman"'>Ruihong</span></span><span
style='font-family:"Times New Roman",serif;mso-fareast-font-family:"Times New Roman"'>
Wang (RDMA-based Big Data Systems)<o:p></o:p></span></p>

<p class=MsoListParagraphCxSpLast style='text-indent:-.25in;mso-list:l1 level1 lfo2'><![if !supportLists]><span
style='font-family:Symbol;mso-fareast-font-family:Symbol;mso-bidi-font-family:
Symbol'><span style='mso-list:Ignore'>·<span style='font:7.0pt "Times New Roman"'>&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;
</span></span></span><![endif]><span dir=LTR></span><span style='font-family:
"Times New Roman",serif;mso-fareast-font-family:"Times New Roman"'>Serkan <span
class=SpellE>Uzunbaz</span> (Shared Execution for Data Analytics over Big Data
Streams) <o:p></o:p></span></p>

<p class=MsoNormal style='margin-left:.25in'><span style='font-family:"Times New Roman",serif;
mso-fareast-font-family:"Times New Roman"'><o:p>&nbsp;</o:p></span></p>

<p class=MsoNormal style='margin-left:.25in'><span style='font-family:"Times New Roman",serif;
mso-fareast-font-family:"Times New Roman"'><o:p>&nbsp;</o:p></span></p>

<p class=MsoNormal style='margin-left:.25in'><span style='font-family:"Times New Roman",serif;
mso-fareast-font-family:"Times New Roman"'>Walid has graduated one Ph.D.
student, Anas <span class=SpellE>Daghistani</span>, co-advised with Professor <span
class=SpellE>Arif</span> Ghafoor (ECE) on the topic of “Attack-Resilient
Adaptive Load-Balancing in Distributed Spatial Data Streaming Systems”, in the
context of this project. This research is currently under review for journal
publication. <o:p></o:p></span></p>

<p class=MsoNormal><span style='font-family:"Times New Roman",serif;mso-fareast-font-family:
"Times New Roman"'><o:p>&nbsp;</o:p></span></p>

<p class=MsoNormal><span style='font-family:"Times New Roman",serif;mso-fareast-font-family:
"Times New Roman"'><o:p>&nbsp;</o:p></span></p>

<p class=MsoNormal style='mso-layout-grid-align:none;text-autospace:none'><a
name=Y20><b><span style='font-family:"Times New Roman",serif;mso-ascii-theme-font:
major-bidi;mso-fareast-font-family:"Times New Roman";mso-hansi-theme-font:major-bidi;
mso-bidi-theme-font:major-bidi;color:black'>2020-2021 Project Activities: <o:p></o:p></span></b></a></p>

<span style='mso-bookmark:Y20'></span>

<p class=MsoNormal><span style='font-family:"Times New Roman",serif;mso-ascii-theme-font:
major-bidi;mso-fareast-font-family:"Times New Roman";mso-hansi-theme-font:major-bidi;
mso-bidi-theme-font:major-bidi'><o:p>&nbsp;</o:p></span></p>

<p class=MsoNormal style='vertical-align:baseline'><span style='font-family:
"Times New Roman",serif;mso-ascii-theme-font:major-bidi;mso-hansi-theme-font:
major-bidi;mso-bidi-theme-font:major-bidi;color:black;border:none windowtext 1.0pt;
mso-border-alt:none windowtext 0in;padding:0in'>In 2020-2021, we had several
research and education activities in the context of this project. We have
addressed the scalability challenge in real-time location services by
developing SWARM, a light-weight adaptivity protocol that continuously monitors
the data and query workloads across the distributed processes of the spatial
data streaming system, and redistributes and rebalances the workloads as soon as
performance bottlenecks get detected. SWARM has been published in the ACM
Transactions on Spatial Algorithms and Systems [ACM TSAS 2021]. We have
investigated the adaptation of Log-Structured Merge trees to support frequent
updates in moving-object spatial databases; this work has been published in the IEEE
International Conference on Data Engineering [ICDE 2021]. Along with
undergraduate and graduate students, we presented a tutorial on the subject of
learned multi-dimensional indexes in the 2020 ACM SIGSPATIAL Conference [ACM
SIGSPATIAL 2020a]. We developed an online workload estimation technique that
relies on a probabilistic model for estimating the workload of partitions and
machines in a distributed spatial data streaming system [ACM SIGSPATIAL 2020b].
We developed an unbiased online sampling technique for the visual exploration of large
spatiotemporal data that was published in the IEEE Visualization Conference
[VAST 2020]. </span><span style='font-family:"Times New Roman",serif;
mso-ascii-theme-font:major-bidi;mso-hansi-theme-font:major-bidi;mso-bidi-theme-font:
major-bidi;color:black;background:white'>We have developed&nbsp;<span
class=SpellE>LocationSpark</span>, a query executor, and an optimizer based on
Spark to improve the query execution plan generated for spatial queries. The
design and performance of <span class=SpellE>LocationSpark</span> were published
in Frontiers in Big Data [Frontiers 2020].<o:p></o:p></span></p>

<p class=MsoNormal style='vertical-align:baseline'><span style='font-family:
"Times New Roman",serif;mso-ascii-theme-font:major-bidi;mso-hansi-theme-font:
major-bidi;mso-bidi-theme-font:major-bidi;color:black;background:white'><o:p>&nbsp;</o:p></span></p>

<p class=MsoNormal><span style='font-family:"Times New Roman",serif;mso-ascii-theme-font:
major-bidi;mso-hansi-theme-font:major-bidi;mso-bidi-theme-font:major-bidi;
color:black'>Walid introduced a project-based research component in the
graduate-level database systems course at Purdue that has benefitted over 35
students. He mentored an undergraduate student to conduct undergraduate
research on topics related to this project. In 2020/2021, Walid graduated one
Ph.D. student on the topic of “Efficient Distributed Processing over
Micro-Batched Data Streams”, and trained seven other Ph.D. students in
project-related research. <o:p></o:p></span></p>

<p class=MsoNormal style='vertical-align:baseline'><span style='font-family:
"Times New Roman",serif;mso-ascii-theme-font:major-bidi;mso-hansi-theme-font:
major-bidi;mso-bidi-theme-font:major-bidi;color:black;border:none windowtext 1.0pt;
mso-border-alt:none windowtext 0in;padding:0in'><o:p>&nbsp;</o:p></span></p>

<p class=MsoNormal style='vertical-align:baseline'><span style='font-family:
"Times New Roman",serif;mso-ascii-theme-font:major-bidi;mso-hansi-theme-font:
major-bidi;mso-bidi-theme-font:major-bidi;color:black;border:none windowtext 1.0pt;
mso-border-alt:none windowtext 0in;padding:0in'>Below, we highlight each of
these contributions and the project’s other research, education, and training
activities.<o:p></o:p></span></p>

<p class=MsoNormal style='vertical-align:baseline'><span style='font-family:
"Times New Roman",serif;mso-ascii-theme-font:major-bidi;mso-hansi-theme-font:
major-bidi;mso-bidi-theme-font:major-bidi;color:black;border:none windowtext 1.0pt;
mso-border-alt:none windowtext 0in;padding:0in'><span
style='mso-spacerun:yes'> </span><o:p></o:p></span></p>

<p class=MsoNormal style='vertical-align:baseline'><b><span style='font-family:
"Times New Roman",serif;mso-ascii-theme-font:major-bidi;mso-hansi-theme-font:
major-bidi;mso-bidi-theme-font:major-bidi;color:black'><a
href="https://www.cs.purdue.edu/homes/aref/IDAS/tsas2021-a.pdf">SWARM: Adaptive
Load Balancing in Distributed Streaming Systems for Big Spatial Data. [ACM TSAS
2021]</a> </span></b><span style='font-family:"Times New Roman",serif;
mso-ascii-theme-font:major-bidi;mso-hansi-theme-font:major-bidi;mso-bidi-theme-font:
major-bidi;color:black'>As is clear from the scale of location services, their
ubiquity, and the massive amounts of spatial data being generated in real-time,
the current scale of spatial data cannot be handled using centralized systems.
This has led to the development of distributed spatial streaming systems.
Existing systems use static spatial partitioning to distribute the workload. In
contrast, the real-time streamed spatial data follows non-uniform spatial
distributions that are continuously changing over time. Distributed spatial
streaming systems need to react to the changes in the distribution of spatial
data and queries. This research introduces SWARM, a light-weight adaptivity
protocol that continuously monitors the data and query workloads across the
distributed processes of the spatial data streaming system, and redistributes
and rebalances the workloads as soon as performance bottlenecks get detected. SWARM
is able to handle multiple query-execution and data-persistence models. A
distributed streaming system can directly use SWARM to adaptively rebalance the
system's workload among its machines with minimal changes to the original code
of the underlying spatial application. Extensive experimental evaluation using
real and synthetic datasets illustrates that, on average, SWARM achieves a 200%
improvement over a static grid partitioning that is determined based on
observing a limited history of the data and query workloads. Moreover, SWARM
reduces execution latency by 4x on average compared with other existing
techniques.<b><o:p></o:p></b></span></p>

<p class=MsoNormal style='vertical-align:baseline'><span style='font-family:
"Times New Roman",serif;mso-ascii-theme-font:major-bidi;mso-hansi-theme-font:
major-bidi;mso-bidi-theme-font:major-bidi;color:black'><o:p>&nbsp;</o:p></span></p>

<p class=MsoNormal style='vertical-align:baseline'><b><span style='font-family:
"Times New Roman",serif;mso-ascii-theme-font:major-bidi;mso-hansi-theme-font:
major-bidi;mso-bidi-theme-font:major-bidi;color:black'><a
href="https://www.cs.purdue.edu/homes/aref/IDAS/matrel2021-a.pdf">Scalable
Relational Query Processing on Big Matrix Data [Submitted 2021]</a> </span></b><span
style='font-family:"Times New Roman",serif;mso-ascii-theme-font:major-bidi;
mso-hansi-theme-font:major-bidi;mso-bidi-theme-font:major-bidi;color:black'>The
use of large-scale machine learning methods is becoming ubiquitous in many
applications ranging from business intelligence to self-driving cars. These
methods require a complex computation pipeline consisting of various types of
operations, e.g., relational operations for pre-processing or post-processing
the dataset, and matrix operations for core model computations. Many existing
systems focus on efficiently processing matrix-only operations, and assume that
the inputs to the relational operators are already pre-computed and are
materialized as intermediate matrices. However, the input to a relational
operator may be complex in machine learning pipelines, and may involve various
combinations of matrix operators. Hence, it is critical to realize scalable and
efficient relational query processors that directly operate on big matrix data.
This research develops new efficient and scalable relational query processing
techniques on big matrix data for in-memory distributed clusters. The proposed
techniques leverage algebraic transformation rules to rewrite query execution
plans into ones with lower computation costs. A distributed query plan
optimizer exploits the sparsity-inducing property of merge functions as well as
Bloom join strategies for efficiently evaluating various flavors of the <span
class=SpellE>join</span> operation. Furthermore, optimized partitioning schemes
for the input matrices are developed to facilitate the performance of join
operations based on a cost model that minimizes the communication overhead. The
proposed relational query processing techniques are prototyped in Apache Spark.
Experiments on both real and synthetic data demonstrate that the proposed
techniques achieve up to two orders of magnitude performance improvement over
state-of-the-art systems on a wide range of applications. <b><o:p></o:p></b></span></p>

<p class=MsoNormal><span style='font-family:"Times New Roman",serif;mso-ascii-theme-font:
major-bidi;mso-hansi-theme-font:major-bidi;mso-bidi-theme-font:major-bidi;
color:black'><br>
<b><span style='background:white'><a
href="https://www.cs.purdue.edu/homes/aref/IDAS/icde2021-a.pdf">The LSM
RUM-Tree: A Log Structured Merge R-Tree for Update-intensive Spatial Workloads
[ICDE 2021]</a> </span></b><span style='background:white'>Many applications require
update-intensive workloads on spatial objects, e.g., social-network services
and shared-riding services that track moving objects (devices). By buffering
insert and delete operations in memory, the Log Structured Merge Tree (LSM) has
been used widely in various systems because of its ability to handle
insert-intensive workloads. While the focus on LSM has been on key-value stores
and their optimizations, there is a need to study how to efficiently support
LSM-based <i>secondary </i>indexes. We investigate the augmentation of a
main-memory-based memo structure into an LSM secondary index structure to
handle update-intensive workloads efficiently. We conduct this study in the
context of an R-tree-based secondary index. In particular, we introduce the LSM
RUM-tree that demonstrates the use of an Update Memo in an LSM-based R-tree to
enhance the performance of the R-tree’s insert, delete, update, and search
operations. The LSM RUM-tree introduces novel strategies to reduce the size of
the Update Memo to be a light-weight in-memory structure that is suitable for
handling update-intensive workloads without introducing significant overhead. <b><o:p></o:p></b></span></span></p>

<p class=MsoNormal><span style='font-family:"Times New Roman",serif;mso-ascii-theme-font:
major-bidi;mso-hansi-theme-font:major-bidi;mso-bidi-theme-font:major-bidi;
color:black;background:white'><o:p>&nbsp;</o:p></span></p>

<p class=MsoNormal><b><span style='font-family:"Times New Roman",serif;
mso-ascii-theme-font:major-bidi;mso-hansi-theme-font:major-bidi;mso-bidi-theme-font:
major-bidi;color:black;background:white'><a
href="https://www.cs.purdue.edu/homes/aref/IDAS/tutorialsigspatial2020-a.pdf">A
Tutorial on Learned Multi-dimensional Indexes [ACM SIGSPATIAL 2020]</a> </span></b><span
style='font-family:"Times New Roman",serif;mso-ascii-theme-font:major-bidi;
mso-hansi-theme-font:major-bidi;mso-bidi-theme-font:major-bidi;color:black;
background:white'>Recently, Machine Learning (ML, for short) has been
successfully applied to database indexing. Initial experimentation on Learned
Indexes has demonstrated better search performance and lower space requirements
than their traditional database counterparts. Numerous attempts have been
explored to extend learned indexes to the multi-dimensional space. This makes
learned indexes potentially suitable for spatial databases. The goal of this
tutorial is to provide up-to-date coverage of learned indexes both in the
single and multi-dimensional spaces. The tutorial covers over 25 learned
indexes. The tutorial navigates through the space of learned indexes through a
taxonomy that helps classify the covered learned indexes both in the single and
multi-dimensional spaces. <b><o:p></o:p></b></span></p>

<p class=MsoNormal style='vertical-align:baseline'><span style='font-family:
"Times New Roman",serif;mso-ascii-theme-font:major-bidi;mso-hansi-theme-font:
major-bidi;mso-bidi-theme-font:major-bidi;color:black'><o:p>&nbsp;</o:p></span></p>

<p class=MsoNormal><b><span style='font-family:"Times New Roman",serif;
mso-ascii-theme-font:major-bidi;mso-hansi-theme-font:major-bidi;mso-bidi-theme-font:
major-bidi;color:black;background:white'><a
href="https://www.cs.purdue.edu/homes/aref/IDAS/sigspatial2020-a.pdf"><span
class=SpellE>TrioStat</span>: Online Workload Estimation in Distributed Spatial
Data Streaming Systems<span style='font-weight:normal'> </span>[ACM SIGSPATIAL
2020]</a> </span></b><span style='font-family:"Times New Roman",serif;
mso-ascii-theme-font:major-bidi;mso-hansi-theme-font:major-bidi;mso-bidi-theme-font:
major-bidi;color:black'>The wide spread of GPS-enabled devices and the Internet
of Things (IoT) has increased the amount of spatial data being generated every second.
The current scale of spatial data cannot be handled using centralized systems.
This has led to the development of distributed spatial data streaming systems
that scale to process in real-time large amounts of streamed spatial data. The
performance of distributed streaming systems relies on how evenly the workload is
distributed among their machines. However, it is challenging to estimate the
workload of each machine because spatial data and query streams are skewed and
rapidly change with time and users’ interests. Moreover, a distributed spatial
streaming system often does not maintain a global system workload state because
it requires high network and processing overheads to be collected from the
machines in the system. In this research, we introduce <span class=SpellE>TrioStat</span>,
an online workload estimation technique that relies on a probabilistic model
for estimating the workload of partitions and machines in a distributed spatial
data streaming system. It is infeasible to collect and exchange statistics with
a centralized unit because it requires high network overhead. Instead, <span
class=SpellE>TrioStat</span> uses a decentralized technique to collect and
maintain the required statistics in real-time locally in each machine. <span
class=SpellE>TrioStat</span> enables distributed spatial data streaming systems
to compare the workloads of machines as well as the workloads of data
partitions. <span class=SpellE>TrioStat</span> requires minimal network and
storage overhead. Moreover, the required storage is distributed across the
system’s machines. <b><span style='background:white'><o:p></o:p></span></b></span></p>

<p class=MsoNormal style='vertical-align:baseline'><span style='font-family:
"Times New Roman",serif;mso-ascii-theme-font:major-bidi;mso-hansi-theme-font:
major-bidi;mso-bidi-theme-font:major-bidi;color:black'><o:p>&nbsp;</o:p></span></p>

<p class=MsoNormal><b><span style='font-family:"Times New Roman",serif;
mso-ascii-theme-font:major-bidi;mso-hansi-theme-font:major-bidi;mso-bidi-theme-font:
major-bidi;color:black;background:white'><a
href="https://www.cs.purdue.edu/homes/aref/IDAS/vast2020-a.pdf">STULL: Unbiased
Online Sampling for Visual Exploration of Large Spatiotemporal Data [VAST 2020]</a></span></b><span
style='font-family:"Times New Roman",serif;mso-ascii-theme-font:major-bidi;
mso-hansi-theme-font:major-bidi;mso-bidi-theme-font:major-bidi;color:black;
background:white'> Online sampling-supported visual analytics is increasingly
important, as it allows users to explore large datasets with acceptable
approximate answers at interactive rates. However, existing online
spatiotemporal sampling techniques are often biased, as most researchers have
primarily focused on reducing computational latency. Biased sampling approaches
select data with unequal probabilities and produce results that do not match
the exact data distribution, leading end users to incorrect interpretations. In
this research, we propose a novel approach to perform unbiased online sampling
of large spatiotemporal data. The proposed approach ensures the same
probability of selection to every point that qualifies the specifications of a
user’s multidimensional query. To achieve unbiased sampling for accurate
representative interactive visualizations, we design a novel data index and an
associated sample retrieval plan. Our proposed sampling approach is suitable
for a wide variety of visual analytics tasks, e.g., tasks that run aggregate
queries of spatiotemporal data. Extensive experiments confirm the superiority
of our approach over a state-of-the-art spatial online sampling technique,
demonstrating that within the same computational time, data samples generated
in our approach are at least 50% more accurate in representing the actual
spatial distribution of the data and enable approximate visualizations to
present closer visual appearances to the exact ones. <o:p></o:p></span></p>

<p class=MsoNormal style='vertical-align:baseline'><span style='font-family:
"Times New Roman",serif;mso-ascii-theme-font:major-bidi;mso-hansi-theme-font:
major-bidi;mso-bidi-theme-font:major-bidi;color:black'><o:p>&nbsp;</o:p></span></p>

<p class=MsoNormal style='vertical-align:baseline'><b><span style='font-family:
"Times New Roman",serif;mso-ascii-theme-font:major-bidi;mso-hansi-theme-font:
major-bidi;mso-bidi-theme-font:major-bidi;color:black'><a
href="https://www.cs.purdue.edu/homes/aref/IDAS/frontiers2020-a.pdf"><span
class=SpellE>LocationSpark</span>: In-memory Distributed Spatial Query
Processing and Optimization [Frontiers 2020]</a> </span></b><span
style='font-family:"Times New Roman",serif;mso-ascii-theme-font:major-bidi;
mso-hansi-theme-font:major-bidi;mso-bidi-theme-font:major-bidi;color:black'>Due
to the ubiquity of spatial data applications and the large amounts of spatial
data that these applications generate and process, there is a pressing need for
scalable spatial query processing. In this research, we develop new techniques
for spatial query processing and optimization in an in-memory and distributed
setup to address scalability. More specifically, we introduce new techniques
for handling query skew that commonly happens in practice, and minimize
communication costs accordingly. We propose a distributed query scheduler that
uses a new cost model to minimize the cost of spatial query processing. The
scheduler generates query execution plans that minimize the effect of query
skew. The query scheduler utilizes new spatial indexing techniques based on
bitmap filters to forward queries to the appropriate local nodes. Each local
computation node is responsible for optimizing and selecting its best local
query execution plan based on the indexes and the nature of the spatial queries
in that node. All the proposed spatial query processing and optimization
techniques are prototyped inside Spark, a distributed memory-based computation
system. Our prototype system is termed <span class=SpellE>LocationSpark</span>.
The experimental study is based on real datasets and demonstrates that <span
class=SpellE>LocationSpark</span> can enhance distributed spatial query
processing by up to an order of magnitude over existing in-memory and
distributed spatial systems.<o:p></o:p></span></p>

<p class=MsoNormal style='vertical-align:baseline'><span style='font-family:
"Times New Roman",serif;mso-ascii-theme-font:major-bidi;mso-hansi-theme-font:
major-bidi;mso-bidi-theme-font:major-bidi;color:black'><o:p>&nbsp;</o:p></span></p>

<p class=MsoNormal style='mso-margin-top-alt:auto;mso-margin-bottom-alt:auto;
background:white'><strong><span style='mso-ascii-font-family:"Times New Roman";
mso-ascii-theme-font:major-bidi;mso-hansi-font-family:"Times New Roman";
mso-hansi-theme-font:major-bidi;mso-bidi-font-family:"Times New Roman";
mso-bidi-theme-font:major-bidi;color:black;border:none windowtext 1.0pt;
mso-border-alt:none windowtext 0in;padding:0in'>Training and Professional
Development</span></strong><b><span style='font-family:"Times New Roman",serif;
mso-ascii-theme-font:major-bidi;mso-hansi-theme-font:major-bidi;mso-bidi-theme-font:
major-bidi;border:none windowtext 1.0pt;mso-border-alt:none windowtext 0in;
padding:0in'><o:p></o:p></span></b></p>

<p class=MsoNormal style='vertical-align:baseline'><span style='font-family:
"Times New Roman",serif;mso-ascii-theme-font:major-bidi;mso-hansi-theme-font:
major-bidi;mso-bidi-theme-font:major-bidi;color:black'>One Ph.D. student, Ahmed
S. Abdelhamid, who was partially funded under this project, has graduated. His
dissertation topic is:&nbsp;Efficient Distributed Processing over Micro-Batched
Data Streams. Student <span class=SpellE>Nameer</span> Qureshi took a graduate
independent study course on topics related to this project.<o:p></o:p></span></p>

<p class=MsoNormal style='vertical-align:baseline'><span style='font-family:
"Times New Roman",serif;mso-ascii-theme-font:major-bidi;mso-hansi-theme-font:
major-bidi;mso-bidi-theme-font:major-bidi;color:black'><o:p>&nbsp;</o:p></span></p>

<p class=MsoNormal style='vertical-align:baseline'><span style='font-family:
"Times New Roman",serif;mso-ascii-theme-font:major-bidi;mso-hansi-theme-font:
major-bidi;mso-bidi-theme-font:major-bidi;color:black'>In Fall 2020, I revised
the project component of the graduate-level database systems course (CS541) to
allow for new research opportunities and training of graduate students through
semester-long group research projects of three students each. Each group agrees
on a project from a list of potential projects that I provided to them (List is
given below). Projects vary in nature to match the various orientations of the
students. Some projects are survey-oriented while others are research-oriented
with heavy programming components. Projects cover a broad spectrum of research
topics. 39 students benefitted from this opportunity and formed 13 group
projects that met with me on a weekly or biweekly basis. Two of these
projects have resulted in submitted conference papers that are under review,
and another paper is currently being prepared. I had some collaborators from
industrial companies, e.g., Google, Uber, and Facebook, to help collaborate in
the projects, and provide the students an industrial twist. Student feedback
was positive as many of them appreciated this research experience and the close
follow-up and feedback I provided on their biweekly or weekly
progressions.&nbsp;<o:p></o:p></span></p>

<p class=MsoNormal style='vertical-align:baseline'><span style='font-family:
"Times New Roman",serif;mso-ascii-theme-font:major-bidi;mso-hansi-theme-font:
major-bidi;mso-bidi-theme-font:major-bidi;color:black'><o:p>&nbsp;</o:p></span></p>

<p class=MsoNormal style='vertical-align:baseline'><span style='font-family:
"Times New Roman",serif;mso-ascii-theme-font:major-bidi;mso-hansi-theme-font:
major-bidi;mso-bidi-theme-font:major-bidi;color:black'>Projects provided
included:&nbsp;&nbsp;<o:p></o:p></span></p>

<p class=MsoNormal style='text-indent:.5in;vertical-align:baseline'><span
style='font-family:"Times New Roman",serif;mso-ascii-theme-font:major-bidi;
mso-hansi-theme-font:major-bidi;mso-bidi-theme-font:major-bidi;color:black'>(1)
A survey of 50 years of database models<o:p></o:p></span></p>

<p class=MsoNormal style='text-indent:.5in;vertical-align:baseline'><span
style='font-family:"Times New Roman",serif;mso-ascii-theme-font:major-bidi;
mso-hansi-theme-font:major-bidi;mso-bidi-theme-font:major-bidi;color:black'>(2)
Studying and comparing the performance of the disk page and record layouts of
PostgreSQL, MySQL, and SQLite<o:p></o:p></span></p>

<p class=MsoNormal style='text-indent:.5in;vertical-align:baseline'><span
style='font-family:"Times New Roman",serif;mso-ascii-theme-font:major-bidi;
mso-hansi-theme-font:major-bidi;mso-bidi-theme-font:major-bidi;color:black'>(3)
Studying and comparing the performance of the table directory structures and
free-space management for PostgreSQL, MySQL, and SQLite <o:p></o:p></span></p>

<p class=MsoNormal style='text-indent:.5in;vertical-align:baseline'><span
style='font-family:"Times New Roman",serif;mso-ascii-theme-font:major-bidi;
mso-hansi-theme-font:major-bidi;mso-bidi-theme-font:major-bidi;color:black'>(4)
Surveying SSD and persistent memory storage technologies, their properties,
and how they impact query processing techniques, index design, concurrency,
and recovery<o:p></o:p></span></p>

<p class=MsoNormal style='text-indent:.5in;vertical-align:baseline'><span
style='font-family:"Times New Roman",serif;mso-ascii-theme-font:major-bidi;
mso-hansi-theme-font:major-bidi;mso-bidi-theme-font:major-bidi;color:black'>(5)
Query compilation techniques for graph data systems<o:p></o:p></span></p>

<p class=MsoNormal style='text-indent:.5in;vertical-align:baseline'><span
style='font-family:"Times New Roman",serif;mso-ascii-theme-font:major-bidi;
mso-hansi-theme-font:major-bidi;mso-bidi-theme-font:major-bidi;color:black'>(6)
Handling bulk-loading anomalies in spatial indexing techniques (is leading to a
conference paper publication)<o:p></o:p></span></p>

<p class=MsoNormal style='text-indent:.5in;vertical-align:baseline'><span
style='font-family:"Times New Roman",serif;mso-ascii-theme-font:major-bidi;
mso-hansi-theme-font:major-bidi;mso-bidi-theme-font:major-bidi;color:black'>(7)
Realizing an updatable compressed bitmap index<o:p></o:p></span></p>

<p class=MsoNormal style='text-indent:.5in;vertical-align:baseline'><span
style='font-family:"Times New Roman",serif;mso-ascii-theme-font:major-bidi;
mso-hansi-theme-font:major-bidi;mso-bidi-theme-font:major-bidi;color:black'>(8)
Implementing different concurrency control protocols in RDMA and evaluating
their tradeoffs<o:p></o:p></span></p>

<p class=MsoNormal style='text-indent:.5in;vertical-align:baseline'><span
style='font-family:"Times New Roman",serif;mso-ascii-theme-font:major-bidi;
mso-hansi-theme-font:major-bidi;mso-bidi-theme-font:major-bidi;color:black'>(9)
Studying RDMA-based distributed transaction management and realizing an
RDMA-based two-phase commit protocol<o:p></o:p></span></p>

<p class=MsoNormal style='text-indent:.5in;vertical-align:baseline'><span
style='font-family:"Times New Roman",serif;mso-ascii-theme-font:major-bidi;
mso-hansi-theme-font:major-bidi;mso-bidi-theme-font:major-bidi;color:black'>(10)
Surveying multi-model database system techniques<o:p></o:p></span></p>

<p class=MsoNormal style='text-indent:.5in;vertical-align:baseline'><span
style='font-family:"Times New Roman",serif;mso-ascii-theme-font:major-bidi;
mso-hansi-theme-font:major-bidi;mso-bidi-theme-font:major-bidi;color:black'>(11)
Studying and comparing techniques for supporting high-dimensional vector
databases<o:p></o:p></span></p>

<p class=MsoNormal style='text-indent:.5in;vertical-align:baseline'><span
style='font-family:"Times New Roman",serif;mso-ascii-theme-font:major-bidi;
mso-hansi-theme-font:major-bidi;mso-bidi-theme-font:major-bidi;color:black'>(12)
Decoupling the storage engine from the compute engine in MySQL<o:p></o:p></span></p>

<p class=MsoNormal style='text-indent:.5in;vertical-align:baseline'><span
style='font-family:"Times New Roman",serif;mso-ascii-theme-font:major-bidi;
mso-hansi-theme-font:major-bidi;mso-bidi-theme-font:major-bidi;color:black'>(13)
Realizing a new algorithm for answering k-nearest-neighbor queries based on a
newly published external merge sort in spatial data systems (is leading to a
conference publication)<o:p></o:p></span></p>

<p class=MsoNormal style='text-indent:.5in;vertical-align:baseline'><span
style='font-family:"Times New Roman",serif;mso-ascii-theme-font:major-bidi;
mso-hansi-theme-font:major-bidi;mso-bidi-theme-font:major-bidi;color:black'>(14)
Designing and implementing various memory-based indexing techniques over RDMA
that support concurrency.<o:p></o:p></span></p>

<p class=MsoNormal style='vertical-align:baseline'><span style='font-family:
"Times New Roman",serif;mso-ascii-theme-font:major-bidi;mso-hansi-theme-font:
major-bidi;mso-bidi-theme-font:major-bidi;color:black'><o:p>&nbsp;</o:p></span></p>

<p class=MsoNormal style='vertical-align:baseline'><span style='font-family:
"Times New Roman",serif;mso-ascii-theme-font:major-bidi;mso-hansi-theme-font:
major-bidi;mso-bidi-theme-font:major-bidi;color:black'>There were 39 students
in class that formed 13 groups. I met biweekly with every group for 30 minutes
each over Zoom. Some&nbsp;groups wanted to be more productive by meeting weekly
in contrast to biweekly and I accommodated that. The students&nbsp;demonstrated
their weekly progress in the project in the form of slide-show presentations
that the students have prepared for&nbsp;every meeting, and/or if need be,
showed program code or performance studies and results.<o:p></o:p></span></p>

<p class=MsoNormal style='vertical-align:baseline'><span style='font-family:
"Times New Roman",serif;mso-ascii-theme-font:major-bidi;mso-hansi-theme-font:
major-bidi;mso-bidi-theme-font:major-bidi;color:black'><o:p>&nbsp;</o:p></span></p>

<p class=MsoNormal style='vertical-align:baseline'><span style='font-family:
"Times New Roman",serif;mso-ascii-theme-font:major-bidi;mso-hansi-theme-font:
major-bidi;mso-bidi-theme-font:major-bidi;color:black'>For graduate students,
in Fall 2020 and Spring 2021, Walid has offered several research training
opportunities as graduate-level PhD research and independent study courses that
involve various project-related topics, where several students got training on
presenting and discussing research papers and in conducting a semester-long
project. These students include <o:p></o:p></span></p>

<p class=MsoListParagraphCxSpFirst style='text-indent:-.25in;mso-list:l0 level1 lfo4;
vertical-align:baseline'><![if !supportLists]><span style='font-family:"Times New Roman",serif;
mso-ascii-theme-font:major-bidi;mso-fareast-font-family:"Times New Roman";
mso-fareast-theme-font:major-bidi;mso-hansi-theme-font:major-bidi;mso-bidi-theme-font:
major-bidi;color:black'><span style='mso-list:Ignore'>1.<span style='font:7.0pt "Times New Roman"'>&nbsp;&nbsp;&nbsp;&nbsp;
</span></span></span><![endif]><span dir=LTR></span><span class=SpellE><span
style='font-family:"Times New Roman",serif;mso-ascii-theme-font:major-bidi;
mso-hansi-theme-font:major-bidi;mso-bidi-theme-font:major-bidi;color:black'>Jaewoo</span></span><span
style='font-family:"Times New Roman",serif;mso-ascii-theme-font:major-bidi;
mso-hansi-theme-font:major-bidi;mso-bidi-theme-font:major-bidi;color:black'>
Shin (Update-tolerant LSM-based Spatial Indexing – resulted in an ICDE 2021
paper)<o:p></o:p></span></p>

<p class=MsoListParagraphCxSpMiddle style='text-indent:-.25in;mso-list:l0 level1 lfo4;
vertical-align:baseline'><![if !supportLists]><span style='font-family:"Times New Roman",serif;
mso-ascii-theme-font:major-bidi;mso-fareast-font-family:"Times New Roman";
mso-fareast-theme-font:major-bidi;mso-hansi-theme-font:major-bidi;mso-bidi-theme-font:
major-bidi;color:black'><span style='mso-list:Ignore'>2.<span style='font:7.0pt "Times New Roman"'>&nbsp;&nbsp;&nbsp;&nbsp;
</span></span></span><![endif]><span dir=LTR></span><span style='font-family:
"Times New Roman",serif;mso-ascii-theme-font:major-bidi;mso-hansi-theme-font:
major-bidi;mso-bidi-theme-font:major-bidi;color:black'>Abdullah Al Mamun (Learned
Spatial Indexing – resulted in a conference paper submission)<o:p></o:p></span></p>

<p class=MsoListParagraphCxSpMiddle style='text-indent:-.25in;mso-list:l0 level1 lfo4;
vertical-align:baseline'><![if !supportLists]><span style='font-family:"Times New Roman",serif;
mso-ascii-theme-font:major-bidi;mso-fareast-font-family:"Times New Roman";
mso-fareast-theme-font:major-bidi;mso-hansi-theme-font:major-bidi;mso-bidi-theme-font:
major-bidi;color:black'><span style='mso-list:Ignore'>3.<span style='font:7.0pt "Times New Roman"'>&nbsp;&nbsp;&nbsp;&nbsp;
</span></span></span><![endif]><span dir=LTR></span><span style='font-family:
"Times New Roman",serif;mso-ascii-theme-font:major-bidi;mso-hansi-theme-font:
major-bidi;mso-bidi-theme-font:major-bidi;color:black'>Ahmed Abdelhamid
(Intelligent Data Partitioning in Micro-batched Big Data Streaming Systems –
resulted in a conference paper submission)<o:p></o:p></span></p>

<p class=MsoListParagraphCxSpMiddle style='text-indent:-.25in;mso-list:l0 level1 lfo4;
vertical-align:baseline'><![if !supportLists]><span style='font-family:"Times New Roman",serif;
mso-ascii-theme-font:major-bidi;mso-fareast-font-family:"Times New Roman";
mso-fareast-theme-font:major-bidi;mso-hansi-theme-font:major-bidi;mso-bidi-theme-font:
major-bidi;color:black'><span style='mso-list:Ignore'>4.<span style='font:7.0pt "Times New Roman"'>&nbsp;&nbsp;&nbsp;&nbsp;
</span></span></span><![endif]><span dir=LTR></span><span style='font-family:
"Times New Roman",serif;mso-ascii-theme-font:major-bidi;mso-hansi-theme-font:
major-bidi;mso-bidi-theme-font:major-bidi;color:black'>Lu Xing (two projects:
Concurrency Control in Graph Data Management Systems, and Waves of Misery in
R-trees – resulted in a conference paper submission)<o:p></o:p></span></p>

<p class=MsoListParagraphCxSpMiddle style='text-indent:-.25in;mso-list:l0 level1 lfo4;
vertical-align:baseline'><![if !supportLists]><span style='font-family:"Times New Roman",serif;
mso-ascii-theme-font:major-bidi;mso-fareast-font-family:"Times New Roman";
mso-fareast-theme-font:major-bidi;mso-hansi-theme-font:major-bidi;mso-bidi-theme-font:
major-bidi;color:black'><span style='mso-list:Ignore'>5.<span style='font:7.0pt "Times New Roman"'>&nbsp;&nbsp;&nbsp;&nbsp;
</span></span></span><![endif]><span dir=LTR></span><span class=SpellE><span
style='font-family:"Times New Roman",serif;mso-ascii-theme-font:major-bidi;
mso-hansi-theme-font:major-bidi;mso-bidi-theme-font:major-bidi;color:black'>Ruihong</span></span><span
style='font-family:"Times New Roman",serif;mso-ascii-theme-font:major-bidi;
mso-hansi-theme-font:major-bidi;mso-bidi-theme-font:major-bidi;color:black'>
Wang (RDMA-based Big Data Systems – resulted in a conference paper submission)<o:p></o:p></span></p>

<p class=MsoListParagraphCxSpMiddle style='text-indent:-.25in;mso-list:l0 level1 lfo4;
vertical-align:baseline'><![if !supportLists]><span style='font-family:"Times New Roman",serif;
mso-ascii-theme-font:major-bidi;mso-fareast-font-family:"Times New Roman";
mso-fareast-theme-font:major-bidi;mso-hansi-theme-font:major-bidi;mso-bidi-theme-font:
major-bidi;color:black'><span style='mso-list:Ignore'>6.<span style='font:7.0pt "Times New Roman"'>&nbsp;&nbsp;&nbsp;&nbsp;
</span></span></span><![endif]><span dir=LTR></span><span class=SpellE><span
style='font-family:"Times New Roman",serif;mso-ascii-theme-font:major-bidi;
mso-hansi-theme-font:major-bidi;mso-bidi-theme-font:major-bidi;color:black'>Libin</span></span><span
style='font-family:"Times New Roman",serif;mso-ascii-theme-font:major-bidi;
mso-hansi-theme-font:major-bidi;mso-bidi-theme-font:major-bidi;color:black'>
Zhou (Distance Oracles for dynamic query constraints)<o:p></o:p></span></p>

<p class=MsoListParagraphCxSpLast style='text-indent:-.25in;mso-list:l0 level1 lfo4;
vertical-align:baseline'><![if !supportLists]><span style='font-family:"Times New Roman",serif;
mso-ascii-theme-font:major-bidi;mso-fareast-font-family:"Times New Roman";
mso-fareast-theme-font:major-bidi;mso-hansi-theme-font:major-bidi;mso-bidi-theme-font:
major-bidi;color:black'><span style='mso-list:Ignore'>7.<span style='font:7.0pt "Times New Roman"'>&nbsp;&nbsp;&nbsp;&nbsp;
</span></span></span><![endif]><span dir=LTR></span><span class=SpellE><span
style='font-family:"Times New Roman",serif;mso-ascii-theme-font:major-bidi;
mso-hansi-theme-font:major-bidi;mso-bidi-theme-font:major-bidi;color:black'>Yeasir</span></span><span
style='font-family:"Times New Roman",serif;mso-ascii-theme-font:major-bidi;
mso-hansi-theme-font:major-bidi;mso-bidi-theme-font:major-bidi;color:black'> <span
class=SpellE>Rayhan</span> (Learned spatial data partitioning and vectorized
spatial query processing).<o:p></o:p></span></p>

<p class=MsoNormal style='vertical-align:baseline'><span style='font-family:
"Times New Roman",serif;mso-ascii-theme-font:major-bidi;mso-hansi-theme-font:
major-bidi;mso-bidi-theme-font:major-bidi;color:black'><o:p>&nbsp;</o:p></span></p>

<p class=MsoNormal style='vertical-align:baseline'><span style='font-family:
"Times New Roman",serif;mso-ascii-theme-font:major-bidi;mso-hansi-theme-font:
major-bidi;mso-bidi-theme-font:major-bidi;color:black'>Undergraduate Research
Opportunities: In the context of this project, Walid has offered research
opportunities during Summer and Fall 2020 for undergraduate students. Most
notable is Undergraduate Student Hao Wu, who was interested in the topic of
ML-based Learned Multidimensional Data Indexing. His research in the topic
materialized into a co-authored tutorial in the ACM SIGSPATIAL 2020 Conference,
where co-authors Hao Wu and Graduate Student Abdullah Al-Mamun participated in
the presentation of the tutorial at the conference. A survey article on the
topic is currently underway.<o:p></o:p></span></p>

<p class=MsoNormal style='vertical-align:baseline'><b><span style='font-family:
"Times New Roman",serif;mso-ascii-theme-font:major-bidi;mso-hansi-theme-font:
major-bidi;mso-bidi-theme-font:major-bidi;color:black'><o:p>&nbsp;</o:p></span></b></p>

<p class=MsoNormal><a name=Y21><b><span style='font-family:"Times New Roman",serif;
mso-ascii-theme-font:major-bidi;mso-fareast-font-family:"Times New Roman";
mso-hansi-theme-font:major-bidi;mso-bidi-theme-font:major-bidi'>2021-2022
Project Activities<o:p></o:p></span></b></a></p>

<span style='mso-bookmark:Y21'></span>

<p class=MsoNormal><span style='font-family:"Times New Roman",serif;mso-fareast-font-family:
"Times New Roman"'><o:p>&nbsp;</o:p></span></p>

<p class=Default><span style='font-size:11.0pt;font-family:"Times New Roman",serif;
mso-bidi-font-family:Arial'>In 2021/2022, the final year of the project, we
investigated supporting data analytics over fast-arriving&nbsp;spatial data
streams. We&nbsp;developed STAR,&nbsp;a distributed in-memory data stream
warehouse system, that provides low-latency and up-to-date analytical results
over a fast-arriving spatial data stream. STAR was published in the 2021 ACM
SIGSPATIAL Conference and was selected as one of the best papers in the
Conference, and was invited in an extended form for journal publication, and
was accepted in the ACM Transactions on Spatial Algorithms and Systems. We
developed&nbsp;<i>Guard</i>, a component that detects and blocks attacks that
target the adaptive load balancing of distributed streaming systems. Guard uses
an unsupervised machine-learning technique to detect malicious users that are
involved in the attack. Guard was published in the IEEE Transactions on
Dependable and Secure Computing. We investigated the presence of
non-deterministic performance and “waves of misery” in update-intensive
workloads over several R-tree variants, and studied how to mitigate this issue.
This research was published in Proceedings of the VLDB 2022. We studied learned
multi-dimensional indexes in the context of an instance-optimized R-tree that
was published in the IEEE Mobile Data Management Conference 2022. We envisioned
how to design location data systems that have location as a first-class data type
and not as an afterthought. Finally, we studied the impact of new hardware
architectures on the design of database systems and how separating memory from
compute in a disaggregated setup would impact database system techniques. Our
vision paper was published in the Proceedings of the VLDB 2022.<o:p></o:p></span></p>

<p class=Default><span style='font-size:11.0pt;font-family:"Times New Roman",serif;
mso-bidi-font-family:Arial'><o:p>&nbsp;</o:p></span></p>

<p class=MsoNormal style='vertical-align:baseline'><span style='font-family:
"Times New Roman",serif;mso-ascii-theme-font:major-bidi;mso-hansi-theme-font:
major-bidi;mso-bidi-theme-font:major-bidi;color:black;border:none windowtext 1.0pt;
mso-border-alt:none windowtext 0in;padding:0in'>Below, we highlight each of
these contributions and the project’s other research, education, and training
activities.<o:p></o:p></span></p>

<p class=Default><span style='font-size:11.0pt;font-family:"Times New Roman",serif;
mso-bidi-font-family:Arial'><o:p>&nbsp;</o:p></span></p>

<p class=Default><b><span style='font-size:11.0pt;font-family:"Times New Roman",serif;
mso-bidi-font-family:Arial'><a
href="https://www.cs.purdue.edu/homes/aref/IDAS/sigspatial2021.pdf">STAR: A
Cache-based Stream Warehouse System for Spatial Data [SIGSPATIAL'2021]</a>, <a
href="https://www.cs.purdue.edu/homes/aref/IDAS/tsas2023.pdf">[ACM TSAS 2023]</a>
</span></b><span style='font-size:11.0pt;font-family:"Times New Roman",serif;
mso-bidi-font-family:Arial'>The proliferation of mobile phones and
location-based services has given rise to an explosive growth in spatial data.
In order to enable spatial data analytics, spatial data needs to be streamed
into a data stream warehouse system that can provide real-time analytical
results over the most recent and historical spatial data in the warehouse.
Existing data stream warehouse systems are not tailored for spatial data. In
this paper, we introduce the&nbsp;STAR&nbsp;system.&nbsp;STAR&nbsp;is a
distributed in-memory data stream warehouse system that provides low-latency
and up-to-date analytical results over a fast-arriving spatial data
stream.&nbsp;STAR&nbsp;supports both snapshot and continuous queries that are
composed of aggregate functions and ad hoc query constraints over spatial,
textual, and temporal data attributes.&nbsp;STAR&nbsp;implements a cache-based
mechanism to facilitate the processing of snapshot queries that collectively
utilizes the techniques of query-based caching (i.e., view materialization) and
object-based caching. Moreover, to speed-up processing continuous
queries,&nbsp;STAR&nbsp;proposes a novel index structure that achieves high
efficiency in both object checking and result updating. Extensive experiments
over real data sets demonstrate the superior performance of&nbsp;STAR&nbsp;over
existing systems.<b><o:p></o:p></b></span></p>

<p class=Default><span style='font-size:11.0pt;font-family:"Times New Roman",serif;
mso-bidi-font-family:Arial'><o:p>&nbsp;</o:p></span></p>

<p class=Default><b><span style='font-size:11.0pt;font-family:"Times New Roman",serif;
mso-bidi-font-family:Arial'><a
href="https://www.cs.purdue.edu/homes/aref/IDAS/tdsc2021.pdf">Guard:
Attack-Resilient Adaptive Load Balancing in Distributed Streaming Systems [IEEE
TDSC 2021]</a></span></b><span style='font-size:11.0pt;font-family:"Times New Roman",serif;
mso-bidi-font-family:Arial'> The performance of distributed streaming systems
relies on how evenly the workload is distributed among their machines. However,
data and query workloads are skewed and change rapidly. Therefore, multiple
adaptive load-balancing mechanisms have been proposed in the literature to
rebalance distributed streaming systems according to the changes in their
workloads. This paper introduces a novel attack model that targets adaptive
load-balancing mechanisms of distributed streaming systems. The attack reduces
the throughput and the availability of the system by making it stay in a
continuous state of rebalancing. This paper proposes Guard, a component that
detects and blocks attacks that target the adaptive load balancing of
distributed streaming systems. Guard uses an unsupervised machine-learning
technique to detect malicious users that are involved in the attack. Guard does
not block any user unless it detects that the user is malicious. Guard does not
depend on a specific application. Experimental evaluation for a high-intensity
attack illustrates that Guard improves the throughput and the availability of
the system by 85% and 86%, respectively. Moreover, Guard improves the minimum
availability that the attacker achieves by 325%. <o:p></o:p></span></p>

<p class=Default><span style='font-size:11.0pt;font-family:"Times New Roman",serif;
mso-bidi-font-family:Arial'><o:p>&nbsp;</o:p></span></p>

<p class=Default><b><span style='font-size:11.0pt;font-family:"Times New Roman",serif;
mso-bidi-font-family:Arial'><a
href="https://www.cs.purdue.edu/homes/aref/IDAS/vldb2021.pdf">An Experimental
Evaluation and Investigation of Waves of Misery in R-trees [VLDB 2021]</a> </span></b><span
style='font-size:11.0pt;font-family:"Times New Roman",serif;mso-bidi-font-family:
Arial'>Waves of misery is a phenomenon where spikes of many node splits occur
over short periods of time in tree indexes. Waves of misery negatively affect
the performance of tree indexes in insertion-heavy workloads. Waves of misery
have been first observed in the context of the B-tree, where these waves cause
unpredictable index performance. In particular, the performance of search and
index-update operations deteriorates when a wave of misery takes place, but is
more predictable between the waves. This paper investigates the presence or
lack of waves of misery in several R-tree variants, and studies the extent to
which these waves impact the performance of each variant. Interestingly,
although having poorer query performance, the Linear and Quadratic R-trees are
found to be more resilient to waves of misery than both the Hilbert and
R*-trees. This paper presents several techniques to reduce the impact in
performance of the waves of misery for the Hilbert and R*-trees. One way to
eliminate waves of misery is to force node splits to take place at regular
times before nodes become full to achieve deterministic performance. The other
way is that upon splitting a node, do not split it evenly but rather at
different node utilization factors. This allows leaf nodes not to fill at the
same pace. We study the impact of two new techniques to mitigate waves of
misery after the tree index has been constructed, namely Regular Elective
Splits (RES, for short) and Unequal Random Splits (URS, for short). Our
experimental investigation highlights the trade-offs in performance of the
introduced techniques and the pros and cons of each technique.<b><o:p></o:p></b></span></p>

<p class=Default><span style='font-size:11.0pt;font-family:"Times New Roman",serif;
mso-bidi-font-family:Arial'><o:p>&nbsp;</o:p></span></p>

<p class=Default><b><span style='font-size:11.0pt;font-family:"Times New Roman",serif;
mso-bidi-font-family:Arial'><a
href="https://www.cs.purdue.edu/homes/aref/IDAS/mdm2022.pdf">The “AI+R”-tree:
An Instance-optimized R-tree [MDM 2022]</a> </span></b><span style='font-size:
11.0pt;font-family:"Times New Roman",serif;mso-bidi-font-family:Arial'>The
emerging class of instance-optimized systems has shown potential to achieve
high performance by specializing to specific data and query workloads.
Particularly, Machine Learning (ML) techniques have been applied successfully
to build various instance-optimized components (e.g., learned indexes). This
paper investigates how to leverage ML techniques to enhance the performance of
spatial indexes, particularly the R-tree, for given data and query workloads.
As the areas covered by the R-tree index nodes overlap in space, upon searching
for a specific point in space, multiple paths from root to leaf may potentially
be explored. In the worst case, the entire R-tree could be searched. In this
paper, we define and use the overlap ratio to quantify the degree of
extraneous leaf node accesses required by a range
query. The goal is to enhance the query performance of a traditional R-tree for
high-overlap range queries as they tend to incur long running-times. We
introduce a new AI-tree that transforms the search operation of an R-tree into
a multi-label classification task to exclude the extraneous leaf node accesses.
Then, we augment a traditional R-tree to the AI-tree to form a hybrid
“AI+R”-tree. The “AI+R”-tree can automatically differentiate between the high- and
low-overlap queries using a learned model. Thus, the “AI+R”-tree processes
high-overlap queries using the AI-tree, and the low-overlap queries using the
R-tree. Experiments on real datasets demonstrate that the “AI+R”-tree can
enhance the query performance over a traditional R-tree by up to 500%. <b><o:p></o:p></b></span></p>

<p class=Default><span style='font-size:11.0pt;font-family:"Times New Roman",serif;
mso-bidi-font-family:Arial'><o:p>&nbsp;</o:p></span></p>

<p class=Default><b><span style='font-size:11.0pt;font-family:"Times New Roman",serif;
mso-bidi-font-family:Arial'><a
href="https://www.cs.purdue.edu/homes/aref/IDAS/vldb2022.pdf">The Case for
Distributed Shared-Memory Databases with RDMA-Enabled Memory Disaggregation [VLDB’22]</a>
</span></b><span style='font-size:11.0pt;font-family:"Times New Roman",serif;
mso-bidi-font-family:Arial'>Memory disaggregation (MD) allows for scalable and
elastic data center design by separating compute (CPU) from memory. With MD,
compute and memory are no longer coupled into the same server box. Instead,
they are connected to each other via ultra-fast networking such as RDMA. MD can
bring many advantages, e.g., higher memory utilization, better independent
scaling (of compute and memory), and lower cost of ownership. This paper makes
the case that MD can fuel the next wave of innovation on database systems. We
observe that MD revives the great debate of &quot;shared what&quot; in the
database community. We envision that distributed shared-memory databases
(DSM-DB, for short) – that have not received much attention before – can be
promising in the future with MD. We present a list of challenges and
opportunities that can inspire next steps in system design making the case for
DSM-DB. <o:p></o:p></span></p>

<p class=Default><span style='font-size:11.0pt;font-family:"Times New Roman",serif;
mso-bidi-font-family:Arial'><o:p>&nbsp;</o:p></span></p>

<p class=Default><b><span style='font-size:11.0pt;font-family:"Times New Roman",serif;
mso-bidi-font-family:Arial'><a
href="https://www.cs.purdue.edu/homes/aref/IDAS/ilx2022.pdf">ILX: Intelligent
&quot;<span class=SpellE>Location+X</span>&quot; Data Systems (Vision Paper)</a>
</span></b><span style='font-size:11.0pt;font-family:"Times New Roman",serif;
mso-bidi-font-family:Arial'>Due to the ubiquity of mobile phones and
location-detection devices, location data is being generated in very large
volumes. Queries and operations that are performed on location data warrant the
use of database systems. Despite that, location data is being supported in data
systems as an afterthought. Typically, relational or NoSQL data systems that
are mostly designed with non-location data in mind get extended with spatial or
spatiotemporal indexes, some query operators, and
higher-level syntactic sugar in order to support location
data. The ubiquity of location data and location data services calls for systems
that are solely designed and optimized for the efficient support of location
data. This paper envisions designing intelligent <span class=SpellE>location+X</span>
data systems, ILX for short, where location is treated as a first-class citizen
type. ILX is tailored with location data as the main data type
(location-first). Because location data is typically augmented with other data
types X, e.g., graphs, text data, click streams, annotations, etc., ILX needs
to be extensible to support other data types X along with location. This paper
envisions the main features that ILX should support, and highlights research
challenges in realizing and supporting ILX. <o:p></o:p></span></p>

<p class=Default><b><span style='font-size:11.0pt;font-family:"Times New Roman",serif;
mso-bidi-font-family:Arial'><o:p>&nbsp;</o:p></span></b></p>

<p class=Default><b><span style='font-size:11.0pt;font-family:"Times New Roman",serif;
mso-bidi-font-family:Arial'>Training and Professional Development<o:p></o:p></span></b></p>

<p class=Default><span style='font-size:11.0pt;font-family:"Times New Roman",serif;
mso-bidi-font-family:Arial'><o:p>&nbsp;</o:p></span></p>

<p class=Default><span style='font-size:11.0pt;font-family:"Times New Roman",serif;
mso-bidi-font-family:Arial'>During the 2021/2022 academic year, Walid has
offered several research training opportunities for graduate students as
graduate-level PhD research and independent study courses that involve various
project-related topics, where several students received training in presenting and
discussing research papers and in conducting a semester-long project. These
students include <o:p></o:p></span></p>

<p class=Default style='margin-left:.5in;text-indent:-.25in;mso-list:l2 level1 lfo5'><![if !supportLists]><span
style='font-size:11.0pt;font-family:"Times New Roman",serif;mso-fareast-font-family:
"Times New Roman"'><span style='mso-list:Ignore'>1.<span style='font:7.0pt "Times New Roman"'>&nbsp;&nbsp;&nbsp;&nbsp;
</span></span></span><![endif]><span dir=LTR></span><span class=SpellE><span
style='font-size:11.0pt;font-family:"Times New Roman",serif;mso-bidi-font-family:
Arial'>Jaewoo</span></span><span style='font-size:11.0pt;font-family:"Times New Roman",serif;
mso-bidi-font-family:Arial'> Shin (Concurrency Control for Update-tolerant
LSM-based Spatial and B-tree Indexing – resulted in a journal paper submission)<o:p></o:p></span></p>

<p class=Default style='margin-left:.5in;text-indent:-.25in;mso-list:l2 level1 lfo5'><![if !supportLists]><span
style='font-size:11.0pt;font-family:"Times New Roman",serif;mso-fareast-font-family:
"Times New Roman"'><span style='mso-list:Ignore'>2.<span style='font:7.0pt "Times New Roman"'>&nbsp;&nbsp;&nbsp;&nbsp;
</span></span></span><![endif]><span dir=LTR></span><span style='font-size:
11.0pt;font-family:"Times New Roman",serif;mso-bidi-font-family:Arial'>Abdullah
Al-Mamun (Learned R-tree Spatial Indexing – resulted in an MDM’22 conference
paper)<o:p></o:p></span></p>

<p class=Default style='margin-left:.5in;text-indent:-.25in;mso-list:l2 level1 lfo5'><![if !supportLists]><span
style='font-size:11.0pt;font-family:"Times New Roman",serif;mso-fareast-font-family:
"Times New Roman"'><span style='mso-list:Ignore'>3.<span style='font:7.0pt "Times New Roman"'>&nbsp;&nbsp;&nbsp;&nbsp;
</span></span></span><![endif]><span dir=LTR></span><span style='font-size:
11.0pt;font-family:"Times New Roman",serif;mso-bidi-font-family:Arial'>Lu Xing
(two projects: Waves of Misery in R-trees – resulted in a VLDB’21 conference
paper, and adaptive tree indexing)<o:p></o:p></span></p>

<p class=Default style='margin-left:.5in;text-indent:-.25in;mso-list:l2 level1 lfo5'><![if !supportLists]><span
style='font-size:11.0pt;font-family:"Times New Roman",serif;mso-fareast-font-family:
"Times New Roman"'><span style='mso-list:Ignore'>4.<span style='font:7.0pt "Times New Roman"'>&nbsp;&nbsp;&nbsp;&nbsp;
</span></span></span><![endif]><span dir=LTR></span><span class=SpellE><span
style='font-size:11.0pt;font-family:"Times New Roman",serif;mso-bidi-font-family:
Arial'>Ruihong</span></span><span style='font-size:11.0pt;font-family:"Times New Roman",serif;
mso-bidi-font-family:Arial'> Wang (RDMA-based Big Data Systems – resulted in a
VLDB’22 vision paper)<o:p></o:p></span></p>

<p class=Default style='margin-left:.5in;text-indent:-.25in;mso-list:l2 level1 lfo5'><![if !supportLists]><span
style='font-size:11.0pt;font-family:"Times New Roman",serif;mso-fareast-font-family:
"Times New Roman"'><span style='mso-list:Ignore'>5.<span style='font:7.0pt "Times New Roman"'>&nbsp;&nbsp;&nbsp;&nbsp;
</span></span></span><![endif]><span dir=LTR></span><span class=SpellE><span
style='font-size:11.0pt;font-family:"Times New Roman",serif;mso-bidi-font-family:
Arial'>Libin</span></span><span style='font-size:11.0pt;font-family:"Times New Roman",serif;
mso-bidi-font-family:Arial'> Zhou (two projects: Lock-free Concurrency Control
for Graph Systems – resulted in a conference paper submission, and Distance
Oracles for dynamic query constraints)<o:p></o:p></span></p>

<p class=Default style='margin-left:.5in;text-indent:-.25in;mso-list:l2 level1 lfo5'><![if !supportLists]><span
style='font-size:11.0pt;font-family:"Times New Roman",serif;mso-fareast-font-family:
"Times New Roman"'><span style='mso-list:Ignore'>6.<span style='font:7.0pt "Times New Roman"'>&nbsp;&nbsp;&nbsp;&nbsp;
</span></span></span><![endif]><span dir=LTR></span><span class=SpellE><span
style='font-size:11.0pt;font-family:"Times New Roman",serif;mso-bidi-font-family:
Arial'>Yeasir</span></span><span style='font-size:11.0pt;font-family:"Times New Roman",serif;
mso-bidi-font-family:Arial'> <span class=SpellE>Rayhan</span> (SIMD-aware
R-tree index – resulted in a conference paper submission).<o:p></o:p></span></p>

<p class=Default><span style='font-size:11.0pt;font-family:"Times New Roman",serif;
mso-bidi-font-family:Arial'><o:p>&nbsp;</o:p></span></p>

<p class=Default><span style='font-size:11.0pt;font-family:"Times New Roman",serif;
mso-bidi-font-family:Arial'>*</span> <span style='font-size:10.0pt'>Disclaimer:
<i>Any opinions, findings, and conclusions or recommendations expressed in this
material are those of the author(s) and do not necessarily reflect the views of
the National Science Foundation.</i></span></p>

<p class=MsoNormal><o:p>&nbsp;</o:p></p>

<p class=MsoNormal><span style='font-size:10.0pt'>Date of Last Update: December
10, 2023</span></p>

<p class=MsoNormal style='margin-left:.25in'><span style='font-family:"Times New Roman",serif;
mso-fareast-font-family:"Times New Roman"'><o:p>&nbsp;</o:p></span></p>

<p class=MsoNormal style='margin-left:.25in'><span style='font-family:"Times New Roman",serif;
mso-fareast-font-family:"Times New Roman"'><o:p>&nbsp;</o:p></span></p>

<p class=MsoNormal style='margin-left:.25in'><span style='font-family:"Times New Roman",serif;
mso-fareast-font-family:"Times New Roman"'><o:p>&nbsp;</o:p></span></p>

</div>

</body>

</html>