<?xml version="1.0" encoding="UTF-8"?>
<rss version="2.0"
	xmlns:content="http://purl.org/rss/1.0/modules/content/"
	xmlns:wfw="http://wellformedweb.org/CommentAPI/"
	xmlns:dc="http://purl.org/dc/elements/1.1/"
	xmlns:atom="http://www.w3.org/2005/Atom"
	xmlns:sy="http://purl.org/rss/1.0/modules/syndication/"
	xmlns:slash="http://purl.org/rss/1.0/modules/slash/"
	xmlns:georss="http://www.georss.org/georss" xmlns:geo="http://www.w3.org/2003/01/geo/wgs84_pos#" xmlns:media="http://search.yahoo.com/mrss/"
	>

<channel>
	<title>Human Language Technology Center of Excellence</title>
	<atom:link href="http://hltcoe.jhu.edu/feed/" rel="self" type="application/rss+xml" />
	<link>http://hltcoe.jhu.edu</link>
	<description></description>
	<lastBuildDate>Fri, 06 Apr 2012 18:26:46 +0000</lastBuildDate>
	<language>en</language>
	<sy:updatePeriod>hourly</sy:updatePeriod>
	<sy:updateFrequency>1</sy:updateFrequency>
	<generator>http://wordpress.com/</generator>
<cloud domain='hltcoe.jhu.edu' port='80' path='/?rsscloud=notify' registerProcedure='' protocol='http-post' />
<image>
		<url>http://s2.wp.com/i/buttonw-com.png</url>
		<title>Human Language Technology Center of Excellence</title>
		<link>http://hltcoe.jhu.edu</link>
	</image>
	<atom:link rel="search" type="application/opensearchdescription+xml" href="http://hltcoe.jhu.edu/osd.xml" title="Human Language Technology Center of Excellence" />
	<atom:link rel='hub' href='http://hltcoe.jhu.edu/?pushpress=hub'/>
		<item>
		<title>April 3, 2012: Technical Exchange</title>
		<link>http://hltcoe.jhu.edu/2012/04/06/403/</link>
		<comments>http://hltcoe.jhu.edu/2012/04/06/403/#comments</comments>
		<pubDate>Fri, 06 Apr 2012 15:54:27 +0000</pubDate>
		<dc:creator>kdaught2</dc:creator>
				<category><![CDATA[Technical Meetings]]></category>

		<guid isPermaLink="false">http://hltcoe.jhu.edu/?p=403</guid>
		<description><![CDATA[These talks are part of our bi-annual seminar presenting an array of current research projects at the HLTCOE. Machine Translation of Arabic Dialects Chris Callison-Burch Translating Low Resource Indic languages Matt Post Preparations for Cross-Lingual Speech Retrieval without Recognition or Translation Adam Lopez Compression Models for Language and Dialect Identification Paul McNamee Building Resources for [...]<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=hltcoe.jhu.edu&amp;blog=26761117&amp;post=403&amp;subd=hltcoe&amp;ref=&amp;feed=1" width="1" height="1" />]]></description>
			<content:encoded><![CDATA[<p>These talks are part of our bi-annual seminar presenting an array of current research projects at the HLTCOE.</p>
<p><strong>Machine Translation of Arabic Dialects</strong><br />
Chris Callison-Burch</p>
<p><strong>Translating Low Resource Indic languages</strong><br />
Matt Post</p>
<p><strong>Preparations for Cross-Lingual Speech Retrieval without Recognition or Translation<br />
</strong>Adam Lopez</p>
<p><strong><strong>Compression Models for Language and Dialect Identification<br />
</strong></strong>Paul McNamee</p>
<p><strong><strong>Building Resources for Multi-lingual Sentiment Analysis<br />
</strong></strong>Theresa Wilson</p>
<p><strong><strong>Stylometric Analysis of Scientific Articles<br />
</strong></strong>Shane Bergsma</p>
<p><strong><strong>Social Power and Its Expression in Written Dialog<br />
</strong></strong>Owen Rambo</p>
<p><strong>What Good is Bad ASR?<br />
</strong>Mark Dredze <strong></strong></p>
<p><strong><br />
</strong></p>
<p><strong><br />
</strong></p>
<p><strong><br />
</strong></p>
<p><strong><br />
</strong></p>
<br />  <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gocomments/hltcoe.wordpress.com/403/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/comments/hltcoe.wordpress.com/403/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godelicious/hltcoe.wordpress.com/403/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/delicious/hltcoe.wordpress.com/403/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gofacebook/hltcoe.wordpress.com/403/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/facebook/hltcoe.wordpress.com/403/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gotwitter/hltcoe.wordpress.com/403/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/twitter/hltcoe.wordpress.com/403/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gostumble/hltcoe.wordpress.com/403/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/stumble/hltcoe.wordpress.com/403/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godigg/hltcoe.wordpress.com/403/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/digg/hltcoe.wordpress.com/403/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/goreddit/hltcoe.wordpress.com/403/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/reddit/hltcoe.wordpress.com/403/" /></a> <img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=hltcoe.jhu.edu&amp;blog=26761117&amp;post=403&amp;subd=hltcoe&amp;ref=&amp;feed=1" width="1" height="1" />]]></content:encoded>
			<wfw:commentRss>http://hltcoe.jhu.edu/2012/04/06/403/feed/</wfw:commentRss>
		<slash:comments>0</slash:comments>
	
		<media:content url="http://1.gravatar.com/avatar/308742bc09c1585d68805c9dd233753e?s=96&#38;d=identicon&#38;r=G" medium="image">
			<media:title type="html">kdaught2</media:title>
		</media:content>
	</item>
		<item>
		<title>April 11, 2012, Peter Clark, Project Halo: Towards a Knowledgeable Biology Textbook</title>
		<link>http://hltcoe.jhu.edu/2012/04/02/april-11-2012-peter-clark-project-halo-towards-a-knowledgeable-biology-textbook/</link>
		<comments>http://hltcoe.jhu.edu/2012/04/02/april-11-2012-peter-clark-project-halo-towards-a-knowledgeable-biology-textbook/#comments</comments>
		<pubDate>Mon, 02 Apr 2012 18:54:48 +0000</pubDate>
		<dc:creator>kdaught2</dc:creator>
				<category><![CDATA[Talks]]></category>

		<guid isPermaLink="false">http://hltcoe.jhu.edu/?p=393</guid>
		<description><![CDATA[Peter Clark, Vulcan Inc. Project Halo: Towards a Knowledgeable Biology Textbook As part of Project Halo at Vulcan Inc, we are creating an (iPadhosted) &#8220;knowledgeable biology textbook&#8221;, called Inquire. Inquire allows the user to not only read and browse the textbook, but also to ask questions and get reasoned or retrieved answers back, explore the [...]<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=hltcoe.jhu.edu&amp;blog=26761117&amp;post=393&amp;subd=hltcoe&amp;ref=&amp;feed=1" width="1" height="1" />]]></description>
			<content:encoded><![CDATA[<p>Peter Clark, Vulcan Inc.</p>
<p>Project Halo: Towards a Knowledgeable Biology Textbook</p>
<p>As part of Project Halo at Vulcan Inc, we are creating an (iPadhosted) &#8220;knowledgeable biology textbook&#8221;, called Inquire. Inquire allows the user to not only read and browse the textbook, but also to ask questions and get reasoned or retrieved answers back, explore the material through semantic connections, and receive suggestions of useful questions to ask. While the core of Inquire is a formal, hand-crafted knowledge base encoding some of the book&#8217;s content, this year we are extending Inquire with capabilities for question-answering directly from the book text itself, integrating technologies for natural language processing, textual entailment, and paraphrasing (including paraphrasing technology from Johns Hopkins), and exploring the extent to which the system can &#8220;reason&#8221; with biology knowledge directly at the textual level. In this talk I will overview the project, and then describe the textual question-answering component in detail, in particular how the various NLP technologies are being integrated. I will also discuss the interplay being developed between the hand-built knowledge and automatic text-extracted knowledge, and how each can potentially support the other, with the formal knowledge providing inference support for textual reasoning and the text-extracted knowledge being a potential source of new material for the formal knowledge-base.</p>
<br />  <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gocomments/hltcoe.wordpress.com/393/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/comments/hltcoe.wordpress.com/393/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godelicious/hltcoe.wordpress.com/393/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/delicious/hltcoe.wordpress.com/393/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gofacebook/hltcoe.wordpress.com/393/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/facebook/hltcoe.wordpress.com/393/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gotwitter/hltcoe.wordpress.com/393/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/twitter/hltcoe.wordpress.com/393/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gostumble/hltcoe.wordpress.com/393/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/stumble/hltcoe.wordpress.com/393/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godigg/hltcoe.wordpress.com/393/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/digg/hltcoe.wordpress.com/393/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/goreddit/hltcoe.wordpress.com/393/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/reddit/hltcoe.wordpress.com/393/" /></a> <img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=hltcoe.jhu.edu&amp;blog=26761117&amp;post=393&amp;subd=hltcoe&amp;ref=&amp;feed=1" width="1" height="1" />]]></content:encoded>
			<wfw:commentRss>http://hltcoe.jhu.edu/2012/04/02/april-11-2012-peter-clark-project-halo-towards-a-knowledgeable-biology-textbook/feed/</wfw:commentRss>
		<slash:comments>0</slash:comments>
	
		<media:content url="http://1.gravatar.com/avatar/308742bc09c1585d68805c9dd233753e?s=96&#38;d=identicon&#38;r=G" medium="image">
			<media:title type="html">kdaught2</media:title>
		</media:content>
	</item>
		<item>
		<title>March 26, 2012, Gregory Sell, “Acoustic Cues for Perceptual Speaker Recognition”</title>
		<link>http://hltcoe.jhu.edu/2012/03/19/march-26-2012-dr-gregory-sell-acoustic-cues-for-perceptual-speaker-recognition/</link>
		<comments>http://hltcoe.jhu.edu/2012/03/19/march-26-2012-dr-gregory-sell-acoustic-cues-for-perceptual-speaker-recognition/#comments</comments>
		<pubDate>Mon, 19 Mar 2012 18:40:53 +0000</pubDate>
		<dc:creator>kdaught2</dc:creator>
				<category><![CDATA[Talks]]></category>

		<guid isPermaLink="false">http://hltcoe.jhu.edu/?p=384</guid>
		<description><![CDATA[Gregory Sell, University of Maryland, College Park “Acoustic Cues for Perceptual Speaker Recognition” While much research has been devoted to the conditional performance of human listeners in speaker recognition tasks, determining how these decisions are made has received less attention.  Automatic speaker recognition has received even more attention from researchers, but progress in this field [...]<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=hltcoe.jhu.edu&amp;blog=26761117&amp;post=384&amp;subd=hltcoe&amp;ref=&amp;feed=1" width="1" height="1" />]]></description>
			<content:encoded><![CDATA[<p>Gregory Sell, University of Maryland, College Park</p>
<p style="text-align:left;" align="center">“Acoustic Cues for Perceptual Speaker Recognition”</p>
<p>While much research has been devoted to the conditional performance of human listeners in speaker recognition tasks, determining how these decisions are made has received less attention.  Automatic speaker recognition has received even more attention from researchers, but progress in this field has focused more on improvements in machine learning rather than increasing perceptual understanding.  In this talk, I will discuss our recent research intended to shine a light on some of these unexplored, fundamental aspects of perceptual speaker recognition.  The conversation will focus around preliminary results from perceptual experiments designed to isolate the effects of individual acoustic cues on human subject performance by using morphed stimuli with those acoustic parameters normalized across all voices.  In the course of this discussion, I will also present previous research on audio database organization with diffusion maps as well as convex demodulation, an algorithm for decomposing an audio signal into its modulator and carrier components within a convex optimization framework.</p>
<p>Bio: Dr. Gregory Sell received his B.A. in Music, Science and Technology in 2005 from Stanford University.  He then stayed on at the school to complete an M.S. in Electrical Engineering (2007) and a Ph.D. in Computer-based Music Theory and Acoustics (2010) as well.  His dissertation work organized audio and musical elements using diffusion mapping, a non-linear mathematical analysis algorithm.  In his time at Stanford, he also developed convex demodulation, a framework for extracting modulators from arbitrary acoustic carriers.  His other research interests include human auditory perception, music information retrieval, and data sonification. He is now an Intelligence Community Postdoctoral Fellow at the University of Maryland, College Park, in the Institute for Systems Research, where he is conducting perceptual experiments to analyze the acoustic cues of speaker recognition.</p>
<br />  <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gocomments/hltcoe.wordpress.com/384/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/comments/hltcoe.wordpress.com/384/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godelicious/hltcoe.wordpress.com/384/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/delicious/hltcoe.wordpress.com/384/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gofacebook/hltcoe.wordpress.com/384/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/facebook/hltcoe.wordpress.com/384/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gotwitter/hltcoe.wordpress.com/384/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/twitter/hltcoe.wordpress.com/384/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gostumble/hltcoe.wordpress.com/384/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/stumble/hltcoe.wordpress.com/384/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godigg/hltcoe.wordpress.com/384/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/digg/hltcoe.wordpress.com/384/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/goreddit/hltcoe.wordpress.com/384/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/reddit/hltcoe.wordpress.com/384/" /></a> <img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=hltcoe.jhu.edu&amp;blog=26761117&amp;post=384&amp;subd=hltcoe&amp;ref=&amp;feed=1" width="1" height="1" />]]></content:encoded>
			<wfw:commentRss>http://hltcoe.jhu.edu/2012/03/19/march-26-2012-dr-gregory-sell-acoustic-cues-for-perceptual-speaker-recognition/feed/</wfw:commentRss>
		<slash:comments>0</slash:comments>
	
		<media:content url="http://1.gravatar.com/avatar/308742bc09c1585d68805c9dd233753e?s=96&#38;d=identicon&#38;r=G" medium="image">
			<media:title type="html">kdaught2</media:title>
		</media:content>
	</item>
		<item>
		<title>March 16, 2012, John Piorkowski, &#8220;Trust in Online Communities&#8221;,</title>
		<link>http://hltcoe.jhu.edu/2012/03/14/march-16-2012-john-piorkowski-trust-in-online-communities/</link>
		<comments>http://hltcoe.jhu.edu/2012/03/14/march-16-2012-john-piorkowski-trust-in-online-communities/#comments</comments>
		<pubDate>Wed, 14 Mar 2012 20:53:26 +0000</pubDate>
		<dc:creator>kdaught2</dc:creator>
				<category><![CDATA[Talks]]></category>

		<guid isPermaLink="false">http://hltcoe.jhu.edu/?p=380</guid>
		<description><![CDATA[John Piorkowski, UMBC and JHU/APL &#8220;Trust in Online Communities&#8221; The scope of this research addresses the role of interpersonal trust between individuals in online communities. Several streams of research to include organizational trust models, trust in virtual settings, speech act theory, identity theory, common bond theory, natural language processing are leveraged to create a novel [...]<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=hltcoe.jhu.edu&amp;blog=26761117&amp;post=380&amp;subd=hltcoe&amp;ref=&amp;feed=1" width="1" height="1" />]]></description>
			<content:encoded><![CDATA[<p>John Piorkowski, UMBC and JHU/APL</p>
<p>&#8220;Trust in Online Communities&#8221;</p>
<p>The scope of this research addresses the role of interpersonal trust between individuals in online communities. Several streams of research to include organizational trust models, trust in virtual settings, speech act theory, identity theory, common bond theory, natural language processing are leveraged to create a novel trust model that is used to determine antecedents for trust and new algorithms for automatic detection of trust in online communities. Online communities continue to grow in the internet and vary from grass roots organizations to communities facilitated by large corporations. Examples of increased use of social networks include seeking health and financial advice. Topics such as these stress the importance of trust between individuals in online communities. Although trust has been widely studied in the literature, the question of how trust evolves in online communities remains as a<br />
research gap. Online communities continue to grow and involve the daily exchange between individuals with no face-to-face interaction. This research aims to model the evolution of trust in online communities leading to the creation of new tools to assist online community managers in moderating communities.</p>
<p>A trust model based on organizational research is defined and tested via an empirical study using a financial investing community. These results are used to create a formal model using social exchange and speech act theories. With a formal model, speech act profiling using N-gram language models and a Hidden Markov Model classifier is investigated for automating the discovery of interpersonal trust relationships.</p>
<p>Bio:<br />
John Piorkowski is PhD student in Information Systems at University of Maryland Baltimore County who is examining trust in online communities.<br />
His research focuses on trust in virtual settings, speech act and identity theories, and natural language processing. In addition, John serves as the<br />
Chief Engineer in the Asymmetric Operations Department at the Johns Hopkins University Applied Physics Laboratory.</p>
<br />  <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gocomments/hltcoe.wordpress.com/380/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/comments/hltcoe.wordpress.com/380/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godelicious/hltcoe.wordpress.com/380/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/delicious/hltcoe.wordpress.com/380/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gofacebook/hltcoe.wordpress.com/380/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/facebook/hltcoe.wordpress.com/380/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gotwitter/hltcoe.wordpress.com/380/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/twitter/hltcoe.wordpress.com/380/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gostumble/hltcoe.wordpress.com/380/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/stumble/hltcoe.wordpress.com/380/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godigg/hltcoe.wordpress.com/380/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/digg/hltcoe.wordpress.com/380/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/goreddit/hltcoe.wordpress.com/380/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/reddit/hltcoe.wordpress.com/380/" /></a> <img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=hltcoe.jhu.edu&amp;blog=26761117&amp;post=380&amp;subd=hltcoe&amp;ref=&amp;feed=1" width="1" height="1" />]]></content:encoded>
			<wfw:commentRss>http://hltcoe.jhu.edu/2012/03/14/march-16-2012-john-piorkowski-trust-in-online-communities/feed/</wfw:commentRss>
		<slash:comments>0</slash:comments>
	
		<media:content url="http://1.gravatar.com/avatar/308742bc09c1585d68805c9dd233753e?s=96&#38;d=identicon&#38;r=G" medium="image">
			<media:title type="html">kdaught2</media:title>
		</media:content>
	</item>
		<item>
		<title>March 19, 2012, Daniel Garcia-Romero, “Automatic Speaker Recognition: 8x improvement in 10 years! Nothing that a 6dB SNR cannot undo&#8221;</title>
		<link>http://hltcoe.jhu.edu/2012/03/07/march-19-2012-daniel-garcia-romero-automatic-speaker-recognition-8x-improvement-in-10-years-nothing-that-a-6db-snr-cannot-undo/</link>
		<comments>http://hltcoe.jhu.edu/2012/03/07/march-19-2012-daniel-garcia-romero-automatic-speaker-recognition-8x-improvement-in-10-years-nothing-that-a-6db-snr-cannot-undo/#comments</comments>
		<pubDate>Wed, 07 Mar 2012 16:56:11 +0000</pubDate>
		<dc:creator>kdaught2</dc:creator>
				<category><![CDATA[Talks]]></category>

		<guid isPermaLink="false">http://hltcoe.jhu.edu/?p=377</guid>
		<description><![CDATA[Daniel Garcia-Romero, University of Maryland &#8220;Automatic Speaker Recognition: 8x improvement in 10 years! Nothing that a 6dB SNR cannot undo&#8221; Automatic speaker recognition in uncontrolled environments is a very challenging task due to channel distortions, additive noise and reverberation. To address these issues, speaker recognition systems have evolved from a simple Gaussian Mixture Model architecture [...]<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=hltcoe.jhu.edu&amp;blog=26761117&amp;post=377&amp;subd=hltcoe&amp;ref=&amp;feed=1" width="1" height="1" />]]></description>
			<content:encoded><![CDATA[<p>Daniel Garcia-Romero, University of Maryland</p>
<p>&#8220;Automatic Speaker Recognition: 8x improvement in 10 years! Nothing that a 6dB SNR cannot undo&#8221;</p>
<p>Automatic speaker recognition in uncontrolled environments is a very challenging task due to channel distortions, additive noise and reverberation. To address these issues, speaker recognition systems have evolved from a simple Gaussian Mixture Model architecture to the current state-of-the-art based on i-vector representations. This has led to an 8x performance improvement measured by the latest NIST evaluation data.</p>
<p>In the first part of the talk, I will present an overview of how the systems have evolved over the past ten years and emphasize two important contributions from my work. Namely, the reformulation of Joint Factor Analysis in terms of over complete dictionaries, and the transformation of i-vectors by length normalization. The first contribution results in computational savings and ease of explanation. The second one has impacted the direction followed by the speaker recognition community due to its high performance and analytical tractability.</p>
<p>In the second part, I will analyze the performance degradation of an i-vector system in the presence of additive noise and propose a robust architecture. In particular, I will explore the use of multi-condition training in a multi-classifier setup. This architecture produces excellent results in anticipated conditions and generalizes well to unseen conditions.</p>
<p>Bio:<br />
Daniel Garcia-Romero is a PhD candidate in the Electrical Engineering Department at the University of Maryland, College Park. His research interests are in the broad areas of speech forensics and machine learning. Most of his contributions are in automatic speaker recognition where he has developed systems to participate in 5 NIST evaluations. He has received the best student paper award at the 159<sup>th</sup> meeting of the Acoustical Society of America (2010), and the best poster award at the 4<sup>th</sup> International Conference on Audio- and Video-Based Biometric Person Authentication, AVBPA (2003).</p>
<br />  <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gocomments/hltcoe.wordpress.com/377/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/comments/hltcoe.wordpress.com/377/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godelicious/hltcoe.wordpress.com/377/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/delicious/hltcoe.wordpress.com/377/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gofacebook/hltcoe.wordpress.com/377/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/facebook/hltcoe.wordpress.com/377/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gotwitter/hltcoe.wordpress.com/377/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/twitter/hltcoe.wordpress.com/377/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gostumble/hltcoe.wordpress.com/377/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/stumble/hltcoe.wordpress.com/377/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godigg/hltcoe.wordpress.com/377/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/digg/hltcoe.wordpress.com/377/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/goreddit/hltcoe.wordpress.com/377/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/reddit/hltcoe.wordpress.com/377/" /></a> <img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=hltcoe.jhu.edu&amp;blog=26761117&amp;post=377&amp;subd=hltcoe&amp;ref=&amp;feed=1" width="1" height="1" />]]></content:encoded>
			<wfw:commentRss>http://hltcoe.jhu.edu/2012/03/07/march-19-2012-daniel-garcia-romero-automatic-speaker-recognition-8x-improvement-in-10-years-nothing-that-a-6db-snr-cannot-undo/feed/</wfw:commentRss>
		<slash:comments>0</slash:comments>
	
		<media:content url="http://1.gravatar.com/avatar/308742bc09c1585d68805c9dd233753e?s=96&#38;d=identicon&#38;r=G" medium="image">
			<media:title type="html">kdaught2</media:title>
		</media:content>
	</item>
		<item>
		<title>March 12, 2012: Matt Post, “Syntactic features for text classification”</title>
		<link>http://hltcoe.jhu.edu/2012/03/07/march-12-2012-matt-post-syntactic-features-for-text-classification/</link>
		<comments>http://hltcoe.jhu.edu/2012/03/07/march-12-2012-matt-post-syntactic-features-for-text-classification/#comments</comments>
		<pubDate>Wed, 07 Mar 2012 16:30:24 +0000</pubDate>
		<dc:creator>kdaught2</dc:creator>
				<category><![CDATA[Talks]]></category>

		<guid isPermaLink="false">http://hltcoe.jhu.edu/?p=375</guid>
		<description><![CDATA[Matt Post,  Johns Hopkins, Human Language Technology Center of Excellence Language models that model phenomena beyond the narrow window of words used by n-gram models have a long history in natural language processing, but relatively little success.  The reasons for these failures are not perfectly understood, but are related to difficult tradeoffs between expressiveness, the [...]<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=hltcoe.jhu.edu&amp;blog=26761117&amp;post=375&amp;subd=hltcoe&amp;ref=&amp;feed=1" width="1" height="1" />]]></description>
			<content:encoded><![CDATA[<p>Matt Post,  Johns Hopkins, Human Language Technology Center of Excellence</p>
<p>Language models that model phenomena beyond the narrow window of words used by n-gram models have a long history in natural language processing, but relatively little success.  The reasons for these failures are not perfectly understood, but are related to difficult tradeoffs between expressiveness, the computational complexity of inference, and the typical setting which integrates language models into the search process of the generation task, where their role is to make fine-grained discriminations among similar hypotheses.  At the same time, the kind of knowledge contained in such models seems necessary to address the severe ungrammaticality of the output of many natural language generation tasks, such as speech recognition and machine translation.</p>
<p>In light of these difficulties, we take a step back from integrated approaches to focus on coarser discriminative tasks.  We demonstrate the effectiveness of syntactic features, showing state of the art classification results on a range of tasks that increasingly approximate the original machine translation setting.  Of particular note is the consistent effectiveness of out-of-domain tree fragments with an extended domain of locality.  With lessons from these coarser tasks in mind, we end with a proposal for an integrated model of syntax-based language modeling within a string-to-tree machine translation decoder.</p>
<p>BIO:</p>
<p>Matt Post is a postdoctoral researcher at the Human Language Technology Center of Excellence at Johns Hopkins University.  He earned his Ph.D. from the University of Rochester in March of 2011, where he worked with Dan Gildea on machine translation, language modeling, and grammar learning.  His main research interests are in machine translation and text analytics.</p>
<br />  <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gocomments/hltcoe.wordpress.com/375/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/comments/hltcoe.wordpress.com/375/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godelicious/hltcoe.wordpress.com/375/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/delicious/hltcoe.wordpress.com/375/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gofacebook/hltcoe.wordpress.com/375/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/facebook/hltcoe.wordpress.com/375/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gotwitter/hltcoe.wordpress.com/375/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/twitter/hltcoe.wordpress.com/375/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gostumble/hltcoe.wordpress.com/375/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/stumble/hltcoe.wordpress.com/375/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godigg/hltcoe.wordpress.com/375/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/digg/hltcoe.wordpress.com/375/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/goreddit/hltcoe.wordpress.com/375/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/reddit/hltcoe.wordpress.com/375/" /></a> <img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=hltcoe.jhu.edu&amp;blog=26761117&amp;post=375&amp;subd=hltcoe&amp;ref=&amp;feed=1" width="1" height="1" />]]></content:encoded>
			<wfw:commentRss>http://hltcoe.jhu.edu/2012/03/07/march-12-2012-matt-post-syntactic-features-for-text-classification/feed/</wfw:commentRss>
		<slash:comments>0</slash:comments>
	
		<media:content url="http://1.gravatar.com/avatar/308742bc09c1585d68805c9dd233753e?s=96&#38;d=identicon&#38;r=G" medium="image">
			<media:title type="html">kdaught2</media:title>
		</media:content>
	</item>
		<item>
		<title>March 7, 2012: Matt Hoffman: Variational Bayesian Methods for Unsupervised Latent Factor Models of Text and Audio</title>
		<link>http://hltcoe.jhu.edu/2012/02/22/wednesday-march-7-2012-matt-hoffman-variational-bayesian-methods-for-unsupervised-latent-factor-models-of-text-and-audio/</link>
		<comments>http://hltcoe.jhu.edu/2012/02/22/wednesday-march-7-2012-matt-hoffman-variational-bayesian-methods-for-unsupervised-latent-factor-models-of-text-and-audio/#comments</comments>
		<pubDate>Wed, 22 Feb 2012 15:44:34 +0000</pubDate>
		<dc:creator>kdaught2</dc:creator>
				<category><![CDATA[Talks]]></category>

		<guid isPermaLink="false">http://hltcoe.jhu.edu/?p=364</guid>
		<description><![CDATA[Matt Hoffman, Columbia University Variational Bayesian Methods for Unsupervised Latent Factor Models of Text and Audio In this talk, I will discuss variational strategies for fitting two Bayesian models that explain high-dimensional media data in terms of sets of latent factors. The first model, Latent Dirichlet Allocation (LDA), is a popular model of text corpora [...]<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=hltcoe.jhu.edu&amp;blog=26761117&amp;post=364&amp;subd=hltcoe&amp;ref=&amp;feed=1" width="1" height="1" />]]></description>
			<content:encoded><![CDATA[<p>Matt Hoffman, Columbia University</p>
<p>Variational Bayesian Methods for Unsupervised Latent Factor Models of Text and Audio</p>
<p>In this talk, I will discuss variational strategies for fitting two Bayesian models that explain high-dimensional media data in terms of sets of latent factors.</p>
<p>The first model, Latent Dirichlet Allocation (LDA), is a popular model of text corpora that learns to represent documents as mixtures of latent &#8220;topic&#8221; distributions. We develop an online variational Bayes (VB) algorithm for LDA. Online LDA is based on online stochastic optimization with a natural gradient step, which we show converges to a local optimum of the VB objective function. It can handily analyze massive document collections, including those arriving in a stream. We study the performance of online LDA in several ways, including by fitting a 100-topic topic model to 3.3M articles from Wikipedia in a single pass. We demonstrate that online LDA finds topic models as good as or better than those found with batch VB, and in a fraction of the time.</p>
<p>The second model, Gamma Process Non negative Matrix Factorization (GaP-NMF), is a new Bayesian nonparametric model of audio spectrograms that addresses the problem of latent source discovery and separation in audio recordings. GaP-NMF allows us to discover what sounds (e.g. bass drums, guitar chords, etc.) are present in a recording and to isolate or suppress individual sources. Crucially, this model is able to decide how many latent sources are necessary to model the data. This feature is particularly valuable in this application, since it is impossible to guess a priori how many sounds will appear in a given recording. Although the GaP-NMF model lacks the conditional conjugacy enjoyed by models such as LDA, we are nonetheless able to efficiently fit it to data using a novel variational algorithm.</p>
<p>Bio:</p>
<p>Matthew D. Hoffman is a postdoctoral researcher in the Department of Statistics at Columbia University. He received his Ph.D. in Computer Science from Princeton University in 2010. His research interests are in machine learning, statistical modeling, audio signal processing, content-based music information retrieval, and the associated computational issues.</p>
<br />  <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gocomments/hltcoe.wordpress.com/364/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/comments/hltcoe.wordpress.com/364/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godelicious/hltcoe.wordpress.com/364/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/delicious/hltcoe.wordpress.com/364/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gofacebook/hltcoe.wordpress.com/364/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/facebook/hltcoe.wordpress.com/364/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gotwitter/hltcoe.wordpress.com/364/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/twitter/hltcoe.wordpress.com/364/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gostumble/hltcoe.wordpress.com/364/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/stumble/hltcoe.wordpress.com/364/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godigg/hltcoe.wordpress.com/364/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/digg/hltcoe.wordpress.com/364/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/goreddit/hltcoe.wordpress.com/364/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/reddit/hltcoe.wordpress.com/364/" /></a> <img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=hltcoe.jhu.edu&amp;blog=26761117&amp;post=364&amp;subd=hltcoe&amp;ref=&amp;feed=1" width="1" height="1" />]]></content:encoded>
			<wfw:commentRss>http://hltcoe.jhu.edu/2012/02/22/wednesday-march-7-2012-matt-hoffman-variational-bayesian-methods-for-unsupervised-latent-factor-models-of-text-and-audio/feed/</wfw:commentRss>
		<slash:comments>0</slash:comments>
	
		<media:content url="http://1.gravatar.com/avatar/308742bc09c1585d68805c9dd233753e?s=96&#38;d=identicon&#38;r=G" medium="image">
			<media:title type="html">kdaught2</media:title>
		</media:content>
	</item>
		<item>
		<title>March 5, 2012: Margaret Mitchell: Generating Descriptions of Visible Objects</title>
		<link>http://hltcoe.jhu.edu/2012/02/21/march-5-2012-margaret-mitchell/</link>
		<comments>http://hltcoe.jhu.edu/2012/02/21/march-5-2012-margaret-mitchell/#comments</comments>
		<pubDate>Tue, 21 Feb 2012 17:19:58 +0000</pubDate>
		<dc:creator>kdaught2</dc:creator>
				<category><![CDATA[Talks]]></category>

		<guid isPermaLink="false">http://hltcoe.jhu.edu/?p=360</guid>
		<description><![CDATA[Margaret Mitchell, University of Aberdeen &#8220;Generating Descriptions of Visible Objects&#8221; Abstract:  What do people describe when they look at objects?  Can we model what they say?  (Why does this matter?)  This talk will characterize what makes up a visual description and define some of the methods necessary to automatically generate such language.  Taking this a [...]<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=hltcoe.jhu.edu&amp;blog=26761117&amp;post=360&amp;subd=hltcoe&amp;ref=&amp;feed=1" width="1" height="1" />]]></description>
			<content:encoded><![CDATA[<p>Margaret Mitchell, University of Aberdeen</p>
<p>&#8220;Generating Descriptions of Visible Objects&#8221;</p>
<p>Abstract:  What do people describe when they look at objects?  Can we model what they say?  (Why does this matter?)  This talk will characterize what makes up a visual description and define some of the methods necessary to automatically generate such language.  Taking this a bit further, I describe an end-to-end prototype system that reads in computer vision output and generates natural language descriptions.  Time permitting, I argue that improving visual descriptions can also improve computer vision, and working on the interaction between the two may lead to advances in both computer vision and natural language generation.  My prototype vision-to-language system, largely developed during the Hopkins summer workshop 2011 in collaboration with vision researchers at Stony Brook and language researchers at U. Maryland, is available at:  <a href="http://recognition.cs.stonybrook.edu:8080/%7Emitchema/midge/">http://recognition.cs.stonybrook.edu:8080/~mitchema/midge/</a></p>
<p>&nbsp;</p>
<p>BIO:</p>
<p>Meg Mitchell graduated with a Bachelor&#8217;s in Linguistics from Reed College in 2005.  Since then, she has worked at the Center for Spoken Language Understanding at Oregon Health and Science University, helping to automatically diagnose neurological disorders by analyzing the syntactic and phonetic characteristics of spoken language.  She has also received a Master&#8217;s in Computational Linguistics from the University of Washington and is working towards a Ph.D in Computing Science at the University of Aberdeen.</p>
<br />  <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gocomments/hltcoe.wordpress.com/360/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/comments/hltcoe.wordpress.com/360/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godelicious/hltcoe.wordpress.com/360/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/delicious/hltcoe.wordpress.com/360/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gofacebook/hltcoe.wordpress.com/360/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/facebook/hltcoe.wordpress.com/360/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gotwitter/hltcoe.wordpress.com/360/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/twitter/hltcoe.wordpress.com/360/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gostumble/hltcoe.wordpress.com/360/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/stumble/hltcoe.wordpress.com/360/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godigg/hltcoe.wordpress.com/360/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/digg/hltcoe.wordpress.com/360/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/goreddit/hltcoe.wordpress.com/360/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/reddit/hltcoe.wordpress.com/360/" /></a> <img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=hltcoe.jhu.edu&amp;blog=26761117&amp;post=360&amp;subd=hltcoe&amp;ref=&amp;feed=1" width="1" height="1" />]]></content:encoded>
			<wfw:commentRss>http://hltcoe.jhu.edu/2012/02/21/march-5-2012-margaret-mitchell/feed/</wfw:commentRss>
		<slash:comments>0</slash:comments>
	
		<media:content url="http://1.gravatar.com/avatar/308742bc09c1585d68805c9dd233753e?s=96&#38;d=identicon&#38;r=G" medium="image">
			<media:title type="html">kdaught2</media:title>
		</media:content>
	</item>
		<item>
		<title>Feb. 27, 2012: Kevin Gimpel: Statistical Modeling and Learning for Machine Translation</title>
		<link>http://hltcoe.jhu.edu/2012/02/16/feb-27-2012-statistical-modeling-and-learning-for-machine-translation-kevin-gimpel/</link>
		<comments>http://hltcoe.jhu.edu/2012/02/16/feb-27-2012-statistical-modeling-and-learning-for-machine-translation-kevin-gimpel/#comments</comments>
		<pubDate>Thu, 16 Feb 2012 14:23:36 +0000</pubDate>
		<dc:creator>kdaught2</dc:creator>
				<category><![CDATA[Talks]]></category>

		<guid isPermaLink="false">http://hltcoe.jhu.edu/?p=347</guid>
		<description><![CDATA[Kevin Gimpel , Carnegie Mellon University “Statistical Modeling and Learning for Machine Translation” Recent years have seen a flurry of research in translation modeling for statistical machine translation. Widely-used approaches include (1) models based on flat phrase-to-phrase mappings, and (2) models that use syntactic structure. I will present an approach that combines the strengths of [...]<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=hltcoe.jhu.edu&amp;blog=26761117&amp;post=347&amp;subd=hltcoe&amp;ref=&amp;feed=1" width="1" height="1" />]]></description>
			<content:encoded><![CDATA[<p>Kevin Gimpel , Carnegie Mellon University</p>
<p style="text-align:left;" align="center">“Statistical Modeling and Learning for Machine Translation”</p>
<p>Recent years have seen a flurry of research in translation modeling for statistical machine translation. Widely-used approaches include (1) models based on flat phrase-to-phrase mappings, and (2) models that use syntactic structure. I will present an approach that combines the strengths of these two in a single model. Experiments show that it leads to improved translation quality over state-of-the-art systems. When supervised syntactic parsers are not available, I will show that unsupervised parsers can be substituted with minimal loss in translation quality. I will also discuss the problem of tuning model parameters. An abundance of techniques has been developed by the statistical machine learning community, but the machine translation problem is fundamentally different from other structure prediction tasks in key ways. These differences have caused well-known learning algorithms to lose theoretical guarantees when applied to machine translation. I will propose a novel algorithm that does offer theoretical guarantees and shows empirical advantage over state-of-the-art approaches.</p>
<p>BIO:</p>
<p>Kevin Gimpel is a PhD student in the Language Technologies Institute at Carnegie Mellon University where he is advised by Noah Smith. His research focuses on machine translation, with supporting interests in natural language processing and machine learning. He is also interested in new tasks involving emerging data sources, including social media, movie reviews, and restaurant menus. He interned with the machine translation team at Google during summer 2009 and has been a Sandia National Laboratories Excellence in Science and Technology Fellow since 2010.</p>
<br />  <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gocomments/hltcoe.wordpress.com/347/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/comments/hltcoe.wordpress.com/347/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godelicious/hltcoe.wordpress.com/347/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/delicious/hltcoe.wordpress.com/347/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gofacebook/hltcoe.wordpress.com/347/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/facebook/hltcoe.wordpress.com/347/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gotwitter/hltcoe.wordpress.com/347/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/twitter/hltcoe.wordpress.com/347/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gostumble/hltcoe.wordpress.com/347/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/stumble/hltcoe.wordpress.com/347/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godigg/hltcoe.wordpress.com/347/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/digg/hltcoe.wordpress.com/347/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/goreddit/hltcoe.wordpress.com/347/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/reddit/hltcoe.wordpress.com/347/" /></a> <img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=hltcoe.jhu.edu&amp;blog=26761117&amp;post=347&amp;subd=hltcoe&amp;ref=&amp;feed=1" width="1" height="1" />]]></content:encoded>
			<wfw:commentRss>http://hltcoe.jhu.edu/2012/02/16/feb-27-2012-statistical-modeling-and-learning-for-machine-translation-kevin-gimpel/feed/</wfw:commentRss>
		<slash:comments>0</slash:comments>
	
		<media:content url="http://1.gravatar.com/avatar/308742bc09c1585d68805c9dd233753e?s=96&#38;d=identicon&#38;r=G" medium="image">
			<media:title type="html">kdaught2</media:title>
		</media:content>
	</item>
		<item>
		<title>Feb. 20, 2012: Lidan Wang: Learning to Efficiently Rank</title>
		<link>http://hltcoe.jhu.edu/2012/02/09/feb-20-2012-learning-to-efficiently-rank-lidan-wang/</link>
		<comments>http://hltcoe.jhu.edu/2012/02/09/feb-20-2012-learning-to-efficiently-rank-lidan-wang/#comments</comments>
		<pubDate>Thu, 09 Feb 2012 17:07:01 +0000</pubDate>
		<dc:creator>kdaught2</dc:creator>
				<category><![CDATA[Talks]]></category>

		<guid isPermaLink="false">http://hltcoe.jhu.edu/?p=340</guid>
		<description><![CDATA[Lidan Wang, University of Maryland “Learning to Efficiently Rank” Technological advances have led to increases in the types and amounts of data, and there is a great need for developing methods to manage and find relevant information from such data to satisfy user&#8217;s information needs. Learning to rank is an emerging discipline at the intersection [...]<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=hltcoe.jhu.edu&amp;blog=26761117&amp;post=340&amp;subd=hltcoe&amp;ref=&amp;feed=1" width="1" height="1" />]]></description>
			<content:encoded><![CDATA[<p>Lidan Wang, University of Maryland</p>
<p>“Learning to Efficiently Rank”</p>
<p>Technological advances have led to increases in the types and amounts of data, and there is a great need for developing methods to manage and find relevant information from such data to satisfy user&#8217;s information needs. Learning to rank is an emerging discipline at the intersection of machine learning, data mining, and information retrieval. It develops principled machine learning algorithms to construct ranking (i.e., retrieval) models, for finding and ranking relevant information to user queries over large amounts of data. Although learning to rank approaches are capable of learning highly effective ranking functions, they have mostly ignored the important issue of model efficiency (i.e., model speed). Given that efficiency and effectiveness are competing forces that often counteract each other, models that are optimized for effectiveness alone may not meet the strict efficiency requirements when dealing with real-world large-scale data-sets.</p>
<p>My PhD thesis introduces the Learning to Efficiently Rank framework for learning large-scale ranking models that facilitate fast and effective retrieval, by exploiting and optimizing the tradeoffs between model complexity (i.e., speed) and accuracy.  At a basic level, this framework learns ranking models whose speed and accuracy can be explicitly controlled.  I proposed and designed solutions for three problems within this framework: 1) learning large-scale ranking models according to a desired tradeoff between model speed and accuracy; 2) constructing temporally-constrained models capable of returning results under time budgets; 3) breaking through the speed/accuracy tradeoff barrier by developing a novel cascade ranking model, and learning the cascade model structure and parameters with a novel boosting-based learning algorithm. My research extends the conventional effectiveness-centric approach in model learning and takes an efficiency-minded look at building effective retrieval models.  Results show that models learned this way significantly outperform traditional machine-learned models in terms of speed without sacrificing result effectiveness. Moreover, the new models work particularly well when users impose stringent time requirements for ranked retrieval on very large data-sets.</p>
<p>Bio:</p>
<p>Lidan Wang is a PhD candidate in the Computer Science Department at the University of Maryland, College Park. She received her Master&#8217;s degree from the Department of Computer Science at the University of Wisconsin, Madison, and Bachelor&#8217;s degree from the Department of Computer Science at the University of Florida. Lidan&#8217;s research interests lie at the intersection of machine learning, information retrieval, and text and data mining. Lidan&#8217;s work focuses on designing large-scale machine learning and information retrieval techniques for learning, mining, and retrieving information at scale. Her PhD dissertation research led to a recent NSF research grant (IIS-1144034), which she co-authored.</p>
<br />  <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gocomments/hltcoe.wordpress.com/340/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/comments/hltcoe.wordpress.com/340/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godelicious/hltcoe.wordpress.com/340/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/delicious/hltcoe.wordpress.com/340/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gofacebook/hltcoe.wordpress.com/340/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/facebook/hltcoe.wordpress.com/340/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gotwitter/hltcoe.wordpress.com/340/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/twitter/hltcoe.wordpress.com/340/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gostumble/hltcoe.wordpress.com/340/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/stumble/hltcoe.wordpress.com/340/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godigg/hltcoe.wordpress.com/340/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/digg/hltcoe.wordpress.com/340/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/goreddit/hltcoe.wordpress.com/340/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/reddit/hltcoe.wordpress.com/340/" /></a> <img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=hltcoe.jhu.edu&amp;blog=26761117&amp;post=340&amp;subd=hltcoe&amp;ref=&amp;feed=1" width="1" height="1" />]]></content:encoded>
			<wfw:commentRss>http://hltcoe.jhu.edu/2012/02/09/feb-20-2012-learning-to-efficiently-rank-lidan-wang/feed/</wfw:commentRss>
		<slash:comments>0</slash:comments>
	
		<media:content url="http://1.gravatar.com/avatar/308742bc09c1585d68805c9dd233753e?s=96&#38;d=identicon&#38;r=G" medium="image">
			<media:title type="html">kdaught2</media:title>
		</media:content>
	</item>
	</channel>
</rss>
