<?xml version="1.0" encoding="UTF-8"?>
<rss version="2.0"
	xmlns:content="http://purl.org/rss/1.0/modules/content/"
	xmlns:wfw="http://wellformedweb.org/CommentAPI/"
	xmlns:dc="http://purl.org/dc/elements/1.1/"
	xmlns:atom="http://www.w3.org/2005/Atom"
	xmlns:sy="http://purl.org/rss/1.0/modules/syndication/"
	xmlns:slash="http://purl.org/rss/1.0/modules/slash/"
	xmlns:georss="http://www.georss.org/georss" xmlns:geo="http://www.w3.org/2003/01/geo/wgs84_pos#" xmlns:media="http://search.yahoo.com/mrss/"
	>

<channel>
	<title>Intentialicious: Markus Strohmaier&#039;s Weblog</title>
	<atom:link href="http://mstrohm.wordpress.com/feed/" rel="self" type="application/rss+xml" />
	<link>http://mstrohm.wordpress.com</link>
	<description>agents, goals &#38; social computation on the web</description>
	<lastBuildDate>Sat, 17 Dec 2011 16:42:00 +0000</lastBuildDate>
	<language>en</language>
	<sy:updatePeriod>hourly</sy:updatePeriod>
	<sy:updateFrequency>1</sy:updateFrequency>
	<generator>http://wordpress.com/</generator>
<cloud domain='mstrohm.wordpress.com' port='80' path='/?rsscloud=notify' registerProcedure='' protocol='http-post' />
<image>
		<url>http://s2.wp.com/i/buttonw-com.png</url>
		<title>Intentialicious: Markus Strohmaier&#039;s Weblog</title>
		<link>http://mstrohm.wordpress.com</link>
	</image>
	<atom:link rel="search" type="application/opensearchdescription+xml" href="http://mstrohm.wordpress.com/osd.xml" title="Intentialicious: Markus Strohmaier&#039;s Weblog" />
	<atom:link rel='hub' href='http://mstrohm.wordpress.com/?pushpress=hub'/>
		<item>
		<title>CfP ACM Hypertext and Social Media 2012</title>
		<link>http://mstrohm.wordpress.com/2011/11/15/cfp-acm-hypertext-and-social-media-2012/</link>
		<comments>http://mstrohm.wordpress.com/2011/11/15/cfp-acm-hypertext-and-social-media-2012/#comments</comments>
		<pubDate>Tue, 15 Nov 2011 09:45:39 +0000</pubDate>
		<dc:creator>Markus Strohmaier</dc:creator>
				<category><![CDATA[Uncategorized]]></category>

		<guid isPermaLink="false">http://mstrohm.wordpress.com/?p=539</guid>
		<description><![CDATA[I&#8217;d like to point you to the following Call for Papers &#8211; make sure to consider submitting your research! 23rd International Conference ACM Hypertext and Social Media (HT&#8217;2012) http://www.ht2012.org June 25-28, 2012 Milwaukee, WI, USA &#160; The ACM Hypertext and Social Media conference is a premium venue for high quality peer-reviewed research on hypertext theory, [...]<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=mstrohm.wordpress.com&amp;blog=2808012&amp;post=539&amp;subd=mstrohm&amp;ref=&amp;feed=1" width="1" height="1" />]]></description>
			<content:encoded><![CDATA[<p>I&#8217;d like to point you to the following Call for Papers &#8211; make sure to consider submitting your research!</p>
<blockquote>
<blockquote><p><strong>23rd International Conference ACM Hypertext and Social Media (HT&#8217;2012)</strong> <a href="http://www.ht2012.org">http://www.ht2012.org</a> June 25-28, 2012 Milwaukee, WI, USA</p>
<p>&nbsp;</p></blockquote>
<blockquote><p>The ACM Hypertext and Social Media conference is a premium venue for high quality peer-reviewed research on hypertext theory, systems and applications. It is concerned with all aspects of modern hypertext research including social media, semantic web, dynamic and computed hypertext and hypermedia as well as narrative systems and applications. The ACM Hypertext and Social Media 2012 conference will focus on exploring, studying and shaping relationships between four important dimensions of links in hypertextual systems and the World Wide Web: people, data, resources and stories.</p></blockquote>
<blockquote><p><strong>Conference tracks and track co-chairs:</strong></p></blockquote>
<blockquote><p>Track 1: <a href="http://www.ht2012.org/tracks/social.xml">Social Media</a> (Linking people)<br />
Claudia Müller-Birn, Freie Universität Berlin, Germany<br />
Munmun De Choudhury, Microsoft Research, USA</p></blockquote>
<blockquote><p>Track 2: <a href="http://www.ht2012.org/tracks/data.xml">Semantic Data</a> (Linking data)<br />
Harith Alani, Open University, UK<br />
Alexandre Passant, DERI, Ireland</p></blockquote>
<blockquote><p>Track 3: <a href="http://www.ht2012.org/tracks/resources.xml">Adaptive Hypertext and Hypermedia</a> (Linking resources)<br />
Jill Freyne, CSIRO, Australia<br />
Shlomo Berkovsky, CSIRO, Australia</p></blockquote>
<blockquote><p>Track 4: <a href="http://www.ht2012.org/tracks/narrative.xml">Hypertext and Narrative Connections</a> (Linking stories)<br />
Andrew S. Gordon, University of Southern California, USA<br />
Frank Nack, University of Amsterdam, The Netherlands</p></blockquote>
<blockquote><p><strong>Important Dates and Submission:</strong></p></blockquote>
<blockquote><p><strong>Full and Short Paper Submission</strong>: Monday Feb 6 2012</p></blockquote>
<blockquote><p><strong>Notification</strong>: Wednesday March 21 2012</p></blockquote>
<blockquote><p><strong>Final Version</strong>: Monday April 23 2012 Submission details are available at <a href="http://www.ht2012.org">http://www.ht2012.org</a></p></blockquote>
<blockquote><p>Submissions will be accepted via <a href="https://www.easychair.org/conferences/?conf=ht2012">https://www.easychair.org/conferences/?conf=ht2012</a></p>
<p><strong>Organization Committee:</strong></p></blockquote>
<blockquote><p>General Chair: Ethan Munson, University of Wisconsin &#8211; Milwaukee, USA</p></blockquote>
<blockquote><p>PC Chair: Markus Strohmaier, Graz University of Technology, Austria</p></blockquote>
<blockquote><p>Publicity Chair: Alvin Chin, Nokia Research Beijing, China</p></blockquote>
</blockquote>
<br />Filed under: <a href='http://mstrohm.wordpress.com/category/uncategorized/'>Uncategorized</a>  <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gocomments/mstrohm.wordpress.com/539/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/comments/mstrohm.wordpress.com/539/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godelicious/mstrohm.wordpress.com/539/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/delicious/mstrohm.wordpress.com/539/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gofacebook/mstrohm.wordpress.com/539/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/facebook/mstrohm.wordpress.com/539/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gotwitter/mstrohm.wordpress.com/539/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/twitter/mstrohm.wordpress.com/539/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gostumble/mstrohm.wordpress.com/539/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/stumble/mstrohm.wordpress.com/539/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godigg/mstrohm.wordpress.com/539/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/digg/mstrohm.wordpress.com/539/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/goreddit/mstrohm.wordpress.com/539/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/reddit/mstrohm.wordpress.com/539/" /></a> <img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=mstrohm.wordpress.com&amp;blog=2808012&amp;post=539&amp;subd=mstrohm&amp;ref=&amp;feed=1" width="1" height="1" />]]></content:encoded>
			<wfw:commentRss>http://mstrohm.wordpress.com/2011/11/15/cfp-acm-hypertext-and-social-media-2012/feed/</wfw:commentRss>
		<slash:comments>0</slash:comments>
	
		<media:content url="" medium="image">
			<media:title type="html">Markus</media:title>
		</media:content>
	</item>
		<item>
		<title>What is the size of the Library of Twitter?</title>
		<link>http://mstrohm.wordpress.com/2011/02/22/what-is-the-size-of-a-library-of-twitter/</link>
		<comments>http://mstrohm.wordpress.com/2011/02/22/what-is-the-size-of-a-library-of-twitter/#comments</comments>
		<pubDate>Tue, 22 Feb 2011 05:57:48 +0000</pubDate>
		<dc:creator>Markus Strohmaier</dc:creator>
				<category><![CDATA[Uncategorized]]></category>

		<guid isPermaLink="false">http://mstrohm.wordpress.com/?p=525</guid>
		<description><![CDATA[The Library of Babel is a theoretical library that holds the sum of all books that can be written with (i) a given set of symbols and (ii) a given page limit. According to Wikipedia, the Library of Babel is based on a short story by the author and librarian Jorge Luis Borges (1899–1986). Its [...]<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=mstrohm.wordpress.com&amp;blog=2808012&amp;post=525&amp;subd=mstrohm&amp;ref=&amp;feed=1" width="1" height="1" />]]></description>
			<content:encoded><![CDATA[<p>The <strong>Library of Babel </strong>is a theoretical library that holds the sum of all books that can be written with (i) a given set of symbols and (ii) a given page limit. According to <a href="http://en.wikipedia.org/wiki/The_Library_of_Babel">Wikipedia</a>, the Library of Babel is based on a short story by the author and librarian <strong>Jorge Luis Borges </strong>(1899–1986). Its idea is simple: the library holds all books that can be produced by every combinatorially possible sequence of symbols up to a certain book length. In Jorge Luis Borges case, the Library is immensly large since it contains all possible books up to 410 pages. The <a href="http://www.americanscientist.org/bookshelf/pub/books-a-million">American Scientist calculates</a>:</p>
<blockquote><p>&#8230; each book has 410 pages, with 40 lines of 80 characters on each page. Thus a book consists of 410 [pages] × 40 [lines] × 80 [characters] = 1,312,000 symbols. There are 25  choices for each of these symbols, and so the library’s collection  consists of 25<sup>1,312,000</sup> books.</p></blockquote>
<p>But <strong>what is the size of a Library of Twitter</strong>, i.e. the size of the set of all theoretically possible tweets? It should be (i) much smaller and (ii) much easier to calculate due to the particular structure of tweets. Here&#8217;s a brief back-of-the-envelope calculation:</p>
<p>Given the 140 character limit of tweets, and assuming an english vocabulary of 26 symbols expanded by basic syntactical elements such as punctuation (.), commas (,), spaces ( ), at signs (@), hashs (#) and a few others, we end up with 140 characters and all combinatorially possible sequences of a vocabulary of maybe 50 symbols. Based on these (conservative) assumptions, the Library of Twitter holds at least  50<sup>140</sup> tweets.</p>
<p>In other words, <strong>the size of the Library of Twitter is at least 7.17 × 10<sup>237</sup></strong> [1] or:</p>
<blockquote>
<pre>7174648137343063403129495466444370592154941142407760751396189613515730343351606279611587524414062500000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000000</pre>
</blockquote>
<p>While this number seems impressive, it pales in comparison to the size of the Library of Babel (which is 1.956 <strong>× </strong>10<sup>1834097</sup>). As with the Library of Babel, most of the Library of Twitter contents would be non-sensical. But on the upside, the library would also <strong>contain all tweets ever written in the past and all theoretically possible tweets to be written in the future</strong>. Thereby, 50<sup>140 </sup>is an upper bound on the information that can be conveyed in 140 characters given a vocabulary of 50 symbols [2]. This first approximate upper bound should be informative for future studies of Twitter to answer questions such as: How many of the theoretically possible tweets have already been written &#8211; or in other words &#8211; how much is there left to write before we run out of (sensical) combinatorial options?</p>
<p>I&#8217;ll leave it to somebody else to calculate the number of bits and hard drives necessary to store, mine and search the Library of Twitter.</p>
<p>[1] all numbers calculated with <a href="http://www.wolframalpha.com/">WolframAlpha</a><br />
[2] It is obvious that larger assumed vocabularies would significantly increase the size of the library.</p>
<br />Filed under: <a href='http://mstrohm.wordpress.com/category/uncategorized/'>Uncategorized</a>  <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gocomments/mstrohm.wordpress.com/525/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/comments/mstrohm.wordpress.com/525/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godelicious/mstrohm.wordpress.com/525/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/delicious/mstrohm.wordpress.com/525/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gofacebook/mstrohm.wordpress.com/525/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/facebook/mstrohm.wordpress.com/525/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gotwitter/mstrohm.wordpress.com/525/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/twitter/mstrohm.wordpress.com/525/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gostumble/mstrohm.wordpress.com/525/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/stumble/mstrohm.wordpress.com/525/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godigg/mstrohm.wordpress.com/525/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/digg/mstrohm.wordpress.com/525/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/goreddit/mstrohm.wordpress.com/525/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/reddit/mstrohm.wordpress.com/525/" /></a> <img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=mstrohm.wordpress.com&amp;blog=2808012&amp;post=525&amp;subd=mstrohm&amp;ref=&amp;feed=1" width="1" height="1" />]]></content:encoded>
			<wfw:commentRss>http://mstrohm.wordpress.com/2011/02/22/what-is-the-size-of-a-library-of-twitter/feed/</wfw:commentRss>
		<slash:comments>6</slash:comments>
	
		<media:content url="" medium="image">
			<media:title type="html">Markus</media:title>
		</media:content>
	</item>
		<item>
		<title>Programming Poems with Mechanical Turk</title>
		<link>http://mstrohm.wordpress.com/2010/12/29/programming-poems-with-mechanical-turk/</link>
		<comments>http://mstrohm.wordpress.com/2010/12/29/programming-poems-with-mechanical-turk/#comments</comments>
		<pubDate>Wed, 29 Dec 2010 07:34:56 +0000</pubDate>
		<dc:creator>Markus Strohmaier</dc:creator>
				<category><![CDATA[research]]></category>
		<category><![CDATA[acrostic]]></category>
		<category><![CDATA[amazon]]></category>
		<category><![CDATA[creativity]]></category>
		<category><![CDATA[crowd programming]]></category>
		<category><![CDATA[crowdsourcing]]></category>
		<category><![CDATA[human computation]]></category>
		<category><![CDATA[mechanical turk]]></category>
		<category><![CDATA[poem programming]]></category>
		<category><![CDATA[poems]]></category>
		<category><![CDATA[poetry]]></category>
		<category><![CDATA[programming crowds]]></category>

		<guid isPermaLink="false">http://mstrohm.wordpress.com/?p=498</guid>
		<description><![CDATA[Mechanical Turk has received some bad press recently (this is one example). It has been pointed out that Mechanical Turk can be used to do evil, which got me interested in seeing whether if and how it can do any good (or at least: creative). This has led to the post here, and resulted in [...]<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=mstrohm.wordpress.com&amp;blog=2808012&amp;post=498&amp;subd=mstrohm&amp;ref=&amp;feed=1" width="1" height="1" />]]></description>
			<content:encoded><![CDATA[<p><a href="http://www.mturk.com/">Mechanical Turk</a> has received some bad press recently (this is <a href="http://behind-the-enemy-lines.blogspot.com/2010/12/mechanical-turk-now-with-4092-spam.html">one example</a>). It has been pointed out that Mechanical Turk can be used to do evil, which got me interested in seeing whether if and how it can do any good (or at least: creative). This has led to the post here, and resulted in the following poem &#8211; collaboratively produced by independent workers on Mechanical Turk.</p>
<blockquote>
<p style="text-align:center;"><em>In the daily life of a Mechanical Turk</em></p>
<p><strong>I</strong>n the daily life of a Mechanical Turk,<br />
<strong>N</strong>ever have I quite finished my work,</p>
<p><strong>F</strong>or I return and refresh and come back for more<br />
<strong>I</strong>n quest of a yet higher score</p>
<p><strong>N</strong>ow and then my eyes may tire<br />
<strong>I</strong>f I said they didn&#8217;t, I&#8217;d be a liar</p>
<p><strong>T</strong>hough I am spent, It&#8217;s hard to stop<br />
<strong>E</strong>ven when I&#8217;m ready to drop</p>
<p><strong>M</strong>y available HITs are waiting for me<br />
<strong>O</strong>cassionally I&#8217;d rather go and watch TV</p>
<p><strong>N</strong>evertheless, I need the cash<br />
<strong>K</strong>een to throw a birthday bash!</p>
<p><strong>E</strong>ver so slowly my earnings increase<br />
<strong>Y</strong>et my passion for Mechanical Turk would never cease &#8230;</p></blockquote>
<p>The structure of the poem is fully algorithmically determined. It has been written collaboratively by a crowd of Mechanical Turkers interacting with each other only through HITs. Before designing the poem algorithm, I&#8217;ve done some research on the structure and different types of poems, which led me to <em>Acrostics</em>.</p>
<blockquote><p>&#8220;An <strong>acrostic</strong> (<a title="Greek language" href="http://en.wikipedia.org/wiki/Greek_language">Greek</a>: <em>ákros</em> &#8220;top&#8221;; <em>stíchos</em> &#8220;verse&#8221;) is a <a title="Poetry" href="http://en.wikipedia.org/wiki/Poetry">poem</a> or other form of writing in which the first letter, syllable or word of each line, <a href="http://en.wikipedia.org/wiki/Paragraph">paragraph</a> or other recurring feature in the text spells out a word or a message.&#8221; (<a href="http://en.wikipedia.org/wiki/Acrostic">wikipedia</a>)</p></blockquote>
<p>In my poem algorithm, I&#8217;ve constrained the first letter of each sentence in the poem, thereby forming an acrostic. As an additional constraint, I required the poem to consist of pairs of sentences that rhyme (similar to a <a href="http://en.wikipedia.org/wiki/Limerick_%28poetry%29">Limerick</a>).</p>
<p>While I determined (i.e. programmed) the structure of the poem, the content was completely produced by mechanical turkers. The only input provided was the title, which acts as the first sentence of the poem as well. Each rhyming pair of sentences was written by 2 different turkers, i.e. the output of one turker was used as an input for another turker. Total price of the poem was 1.804 USD. The poem was built incrementally, each subsequent turker had access to the output of all previous turkers. All tasks were requested at least 3 times, selection among alternatives was done by me, although it could have easily been done by Turkers themselves. In total, the contributions of 7 different Turkers were used in the poem above (while many more have worked on the HITs).</p>
<p>With that, I&#8217;ve initialized the poem algorithm with the acrostic &#8220;<strong>Infinite Monkey</strong>&#8221; and the title &#8220;<em>In the daily life of a Mechanical Turk</em>&#8221; and ran it on Mechanical Turk. The result can be seen above.</p>
<p>The Infinite Monkey acrostic refers to the Infinite Monkey Theorem:</p>
<blockquote><p>&#8220;The <strong>Infinite Monkey Theorem </strong>states that a monkey hitting keys at random on a typewriter keyboard for an infinite amount of time will almost surely type a given text, such as the complete works of William Shakespeare.&#8221; (<a href="http://en.wikipedia.org/wiki/Infinite_monkey_theorem">Wikipedia</a>)</p></blockquote>
<p>That&#8217;s what we are trying to test here, in a less statistic and a more informed manner though. Instead of producing all possible poems, we are interested in producing constrained yet plausible poems, efficiently (i.e. in very few iterations).</p>
<p>Which leads to a variation of the Infite Monkey Theorem that I&#8217;d like to propose here:</p>
<blockquote><p>The <strong>Finite Turker Theorem </strong>states that a finite (yet potentially large) number of independent writers (here: Mechanical Turkers) will almost surely produce a poem that is creative, enjoyable and mostly indistinguishable from a single author poem.</p></blockquote>
<p>With the Finite Turker Theorem, and market places such as Mechanical Turk, it might be possible to outsource creative work &#8211; such as poem writing &#8211; to a large set of workers without much penalty in terms of beauty or enjoyability. Algorithms such as the one above can constraint and influence the resulting poems, giving greater control about the outcome of creative processes (which sounds like an oxymoron).</p>
<p>Because HITs were requested multiple times, there were several rejects that did not make it into the final poem, but which show some of the difficulties as well as the creative potential of programmed poems, including:</p>
<blockquote><p>&#8230;<br />
For I return and refresh and come back for more<br />
Info, my pimp: [I'm] a Dolores Labs penny whore<br />
&#8230;</p></blockquote>
<p><strong>Conclusion:</strong> It has been suggested that the primary use of Mechanical Turk is the execution of simple, easily replacable and often spam-related work. This little experiment suggests that Mechanical Turk can serve richer purposes, by tapping into the creative energy of an underestimated, underutilized but also (currently) underpaid work force.</p>
<br />Filed under: <a href='http://mstrohm.wordpress.com/category/research/'>research</a>  <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gocomments/mstrohm.wordpress.com/498/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/comments/mstrohm.wordpress.com/498/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godelicious/mstrohm.wordpress.com/498/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/delicious/mstrohm.wordpress.com/498/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gofacebook/mstrohm.wordpress.com/498/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/facebook/mstrohm.wordpress.com/498/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gotwitter/mstrohm.wordpress.com/498/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/twitter/mstrohm.wordpress.com/498/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gostumble/mstrohm.wordpress.com/498/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/stumble/mstrohm.wordpress.com/498/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godigg/mstrohm.wordpress.com/498/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/digg/mstrohm.wordpress.com/498/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/goreddit/mstrohm.wordpress.com/498/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/reddit/mstrohm.wordpress.com/498/" /></a> <img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=mstrohm.wordpress.com&amp;blog=2808012&amp;post=498&amp;subd=mstrohm&amp;ref=&amp;feed=1" width="1" height="1" />]]></content:encoded>
			<wfw:commentRss>http://mstrohm.wordpress.com/2010/12/29/programming-poems-with-mechanical-turk/feed/</wfw:commentRss>
		<slash:comments>4</slash:comments>
	
		<media:content url="" medium="image">
			<media:title type="html">Markus</media:title>
		</media:content>
	</item>
		<item>
		<title>A game-with-a-purpose based on Twitter</title>
		<link>http://mstrohm.wordpress.com/2010/10/11/playing-buzzword-bingo-on-twitter/</link>
		<comments>http://mstrohm.wordpress.com/2010/10/11/playing-buzzword-bingo-on-twitter/#comments</comments>
		<pubDate>Mon, 11 Oct 2010 17:22:58 +0000</pubDate>
		<dc:creator>Markus Strohmaier</dc:creator>
				<category><![CDATA[research]]></category>
		<category><![CDATA[Uncategorized]]></category>
		<category><![CDATA[bingo]]></category>
		<category><![CDATA[games with a purpose]]></category>
		<category><![CDATA[tweets]]></category>
		<category><![CDATA[twitter]]></category>

		<guid isPermaLink="false">http://mstrohm.wordpress.com/?p=484</guid>
		<description><![CDATA[I am happy to announce that my research group at TU Graz has launched Bulltweetbingo!, a game-with-a-purpose based on Twitter, today. The game is already live and available at http://bingo.tugraz.at. For an introduction to the idea of Buzzword Bingo, please see the following IBM commercial (Youtube video). &#160; &#160; Rather than playing buzzword bingo while [...]<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=mstrohm.wordpress.com&amp;blog=2808012&amp;post=484&amp;subd=mstrohm&amp;ref=&amp;feed=1" width="1" height="1" />]]></description>
			<content:encoded><![CDATA[<p>I am happy to announce that my research group at TU Graz has launched Bulltweetbingo!, a game-with-a-purpose based on Twitter, today. The game is already live and available at <a href="http://bingo.tugraz.at/">http://bingo.tugraz.at</a>. For an introduction to the idea of Buzzword Bingo, please see the following IBM commercial (<a href="http://www.youtube.com/watch?v=cgeLY7CL5IE">Youtube video</a>).</p>
<p>&nbsp;</p>
<div id="attachment_487" class="wp-caption aligncenter" style="width: 310px"><a href="http://www.youtube.com/watch?v=cgeLY7CL5IE"><img class="size-medium wp-image-487 " title="Playing Buzzword Bingo on Twitter" src="http://mstrohm.files.wordpress.com/2010/10/playing-buzzword-bingo-on-twitter.jpg?w=300&#038;h=210" alt="" width="300" height="210" /></a><p class="wp-caption-text">IBM Innovation Buzzword Bingo (Youtube)</p></div>
<p>&nbsp;</p>
<p>Rather than playing buzzword bingo while listening to a talk, the idea of Bulltweetbingo! is to play Buzzword Bingo with the people you follow on Twitter. All people you follow on Twitter automatically participate in the game by tweeting. A Bulltweetbingo game terminates (i.e. hits &#8220;Bingo!&#8221;) if the people you follow on Twitter use a particular combination of the defined buzzwords in their tweets. We intend to use the data provided by each game in our research on analzying the semantics of short messages on systems such as Twitter or Facebook. Each game provides information about the relevance and topics of tweets for a particular person as well as some information on the topics of tweets that a person expects to receive in the future.</p>
<p>I&#8217;m copy&#8217;n pasting some more information about the game that we have made available on the game website  (<a href="http://bingo.tugraz.at/about">about the project</a>).</p>
<blockquote><p><strong>Bulltweetbingo! </strong><br />
Playing a game of bingo with people you follow on Twitter.</p>
<p><em>A team of researchers from Graz University of Technology, Austria has  developed one of the first games-with-a-purpose that is exclusively  based on Twitter.</em></p>
<p><em>The goal of this project is to annotate and to better understand the  short messages posted to so-called social awareness streams such as  Twitter or Facebook. Using this data, the researchers aim to improve the  ability of computers to effectively organize and make sense out of the  sea of short messages available today.</em></p>
<p><em>Dr. Markus Strohmaier, Assistant Professor at the Knowledge Management  Institute at Graz University of Technology, Austria explains: &#8220;While  social awareness streams such as Twitter or Facebook have experienced  significant popularity over the last few years, we know little about how  to best understand, search and organize the information that is  contained in them.&#8221;</em></p>
<p><em>To tackle this problem, the researchers have developed a game of  Buzzword Bingo that users can play with people they follow on Twitter.</em></p>
<p><em>&#8220;With each game users play on our website, we will collect data that  helps us develop more effective algorithms for better understanding this  new kind of data&#8221; Dr. Markus Strohmaier says, &#8220;and in addition to that,  we simply hope users would enjoy playing a game of Bingo on Twitter.  Each game is unique and exciting in a sense that users generally don’t  know what tweets people will publish during the course of a bingo game&#8221;.</em></p>
<p><em>The researchers have launched the site bulltweetbingo! and ask users  to sign up and to play a game of Bingo with the people they follow on  Twitter. Twitter users can sign up at <a href="http://bingo.tugraz.at">http://bingo.tugraz.at</a>.</em></p></blockquote>
<p>The game was implemented by one of my talented students, <a href="https://twitter.com/simon_walk">Simon Walk</a> &#8211; Make sure to hire him if you need a complex web project to be realized quickly and effectively!</p>
<br />Filed under: <a href='http://mstrohm.wordpress.com/category/research/'>research</a>, <a href='http://mstrohm.wordpress.com/category/uncategorized/'>Uncategorized</a>  <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gocomments/mstrohm.wordpress.com/484/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/comments/mstrohm.wordpress.com/484/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godelicious/mstrohm.wordpress.com/484/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/delicious/mstrohm.wordpress.com/484/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gofacebook/mstrohm.wordpress.com/484/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/facebook/mstrohm.wordpress.com/484/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gotwitter/mstrohm.wordpress.com/484/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/twitter/mstrohm.wordpress.com/484/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gostumble/mstrohm.wordpress.com/484/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/stumble/mstrohm.wordpress.com/484/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godigg/mstrohm.wordpress.com/484/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/digg/mstrohm.wordpress.com/484/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/goreddit/mstrohm.wordpress.com/484/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/reddit/mstrohm.wordpress.com/484/" /></a> <img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=mstrohm.wordpress.com&amp;blog=2808012&amp;post=484&amp;subd=mstrohm&amp;ref=&amp;feed=1" width="1" height="1" />]]></content:encoded>
			<wfw:commentRss>http://mstrohm.wordpress.com/2010/10/11/playing-buzzword-bingo-on-twitter/feed/</wfw:commentRss>
		<slash:comments>0</slash:comments>
	
		<media:content url="" medium="image">
			<media:title type="html">Markus</media:title>
		</media:content>

		<media:content url="http://mstrohm.files.wordpress.com/2010/10/playing-buzzword-bingo-on-twitter.jpg?w=300" medium="image">
			<media:title type="html">Playing Buzzword Bingo on Twitter</media:title>
		</media:content>
	</item>
		<item>
		<title>Are Tag Clouds Useful for Navigating Social Media?</title>
		<link>http://mstrohm.wordpress.com/2010/08/16/are-tag-clouds-useful-for-navigating-social-media/</link>
		<comments>http://mstrohm.wordpress.com/2010/08/16/are-tag-clouds-useful-for-navigating-social-media/#comments</comments>
		<pubDate>Mon, 16 Aug 2010 14:12:01 +0000</pubDate>
		<dc:creator>Markus Strohmaier</dc:creator>
				<category><![CDATA[Uncategorized]]></category>
		<category><![CDATA[navigating]]></category>
		<category><![CDATA[navigation]]></category>
		<category><![CDATA[social computation]]></category>
		<category><![CDATA[social computing]]></category>
		<category><![CDATA[social media]]></category>
		<category><![CDATA[social tagging systems]]></category>
		<category><![CDATA[socialcom2010]]></category>
		<category><![CDATA[tag clouds]]></category>
		<category><![CDATA[tagging]]></category>
		<category><![CDATA[tags]]></category>

		<guid isPermaLink="false">http://mstrohm.wordpress.com/?p=463</guid>
		<description><![CDATA[This week, my colleague Denis Helic will present results from a recent collaboration investigating the usefulness of tag clouds at the IEEE SocialCom 2010 conference in Minneapolis, Minnesota, USA. In this paper (download pdf), we investigated if and to what extent tag clouds &#8211; a popular mechanism for interacting with social media &#8211; are useful [...]<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=mstrohm.wordpress.com&amp;blog=2808012&amp;post=463&amp;subd=mstrohm&amp;ref=&amp;feed=1" width="1" height="1" />]]></description>
			<content:encoded><![CDATA[<p>This week, my colleague <a href="http://coronet.iicm.tugraz.at/denis/homepage/">Denis Helic</a> will present results from a recent collaboration investigating the usefulness of tag clouds at the IEEE <a href="http://www.iisocialcom.org/conference/socialcom2010/">SocialCom 2010</a> conference in Minneapolis, Minnesota, USA. In this paper (<a href="http://kmi.tugraz.at/staff/markus/documents/2010_SocialCom2010_Navigability.pdf">download pdf</a>), we investigated if and to what extent tag clouds &#8211; a  popular mechanism for interacting with social media &#8211; are useful for  navigation.</p>
<div id="attachment_465" class="wp-caption aligncenter" style="width: 310px"><a href="http://mstrohm.files.wordpress.com/2010/08/tagcloud.jpg"><img class="size-medium wp-image-465" title="Are Tag Clouds Useful for Navigating Social Tagging Systems?" src="http://mstrohm.files.wordpress.com/2010/08/tagcloud.jpg?w=300&#038;h=95" alt="" width="300" height="95" /></a><p class="wp-caption-text">An Exemplary Tag Cloud from Flickr.com</p></div>
<p>While tag clouds can potentially serve different purposes, there seems to be an implicit assumption among engineers of social tagging systems that tag clouds are specifically useful to support navigation. This is evident in the large-scale adoption of tag clouds for interlinking resources in numerous systems such as Flickr, Delicious, and BibSonomy. However, this <strong>Navigability Assumption </strong>has hardly been critically reflected (with some notable exceptions, for example [1]), and has largely remained untested in the past. In this paper, we demonstrate that the prevalent approach to tag cloud-based navigation in social tagging systems is highly problematic with regard to network-theoretic measures of navigability. In a series of experiments, we will show that the Navigability Assumption <strong>only holds in very specific settings</strong>, and for the most common scenarios, we can assert that it is <strong>wrong</strong>.</p>
<p>While recent research has studied navigation in social tagging systems from user interface [2], [3], [4] and network-theoretic [5] perspectives, the unique focus of this paper is the intersection of these issues. This paper provides answers to questions such as: How do user interface constraints of tag clouds affect the navigability of tagging systems? And how efficient is navigation via tag clouds from a network-theoretic perspective? Particularly, we first 1) investigate the intrinsic navigability of tagging datasets without considering user interface effects, and then 2) take pragmatic user interface constraints into account. We 3) will demonstrate that for many social tagging systems, the so-called Navigability Assumption does not hold and we will finally 4) use our findings to illuminate a path towards improving the navigability of tag clouds.</p>
<p>Here&#8217;s the abstract:</p>
<blockquote><p><strong>Abstract</strong>: It is a widely held belief among designers of social tagging systems that tag clouds represent a useful tool for navigation. This is evident in, for example, the increasing number of tagging systems offering tag clouds for navigational purposes, which hints towards an implicit assumption that tag clouds support efficient navigation. In this paper, we examine and test this assumption from a network-theoretic perspective, and show that in many cases it does not hold. We first model navigation in tagging systems as a bipartite graph of tags and resources and then simulate the navigation process in such a graph. We use network-theoretic properties to analyse the navigability of three tagging datasets with regard to different user interface restrictions imposed by tag clouds. Our results confirm that tag-resource networks have efficient navigation properties in theory, but they also show that popular user interface decisions (such as “pagination” combined with reverse-chronological listing of resources) significantly impair the potential of tag clouds as a useful tool for navigation. Based on our findings, we identify a number of avenues for further research and the design of novel tag cloud construction algorithms. Our work is relevant for researchers interested in navigability of emergent hypertext structures, and for engineers seeking to improve the navigability of social tagging systems.</p></blockquote>
<p>The results presented in this paper make a theoretical and an empirical argument against existing approaches to tag cloud construction. Our work thereby both confirms and refutes the assumption that current tag cloud incarnations are a useful tool for navigating social tagging systems. While we confirm that tag-resource networks have efficient navigational properties in theory, we show that popular user interface decisions (such as “pagination” combined with reverse-chronological listing of resources) significantly impair navigability. Our experimental results demonstrate that popular approaches to using tag clouds for navigational purposes suffer from significant problems. We conclude that in order to make full use of the potential of tag clouds for navigating social tagging systems, new and more sophisticated ways of thinking about designing tag cloud algorithms are needed.</p>
<p>Here&#8217;s the full reference for the paper, and a link to the pdf as well as to preliminary slides:</p>
<p><strong>Reference and PDF Download:</strong> D. Helic, C. Trattner, M. Strohmaier and K. Andrews, <a href="http://kmi.tugraz.at/staff/markus/documents/2010_SocialCom2010_Navigability.pdf">On the Navigability of Social Tagging Systems</a>, The 2nd IEEE International  Conference on Social Computing (SocialCom 2010), Minneapolis, Minnesota, USA, 2010.  (<em><span style="color:#ff0000;">download</span> </em><a href="http://kmi.tugraz.at/staff/markus/documents/2010_SocialCom2010_Navigability.pdf">pdf</a>) (<a href="http://www.slideshare.net/mstrohm/on-the-navigability-of-social-tagging-systems">related slides</a>)</p>
<p>Further references:</p>
<p>[1] M. A. Hearst and D. Rosner, “Tag clouds: Data analysis tool or social signaller?” in HICSS ’08: Proceedings of the Proceedings of the 41st Annual Hawaii International Conference on System Sciences. Washington, DC, USA: IEEE Computer Society, 2008.<br />
[2] C. S. Mesnage and M. J. Carman, “Tag navigation,” in SoSEA ’09: Proceedings of the 2nd international workshop on Social software engineering and applications. New York, NY, USA: ACM, 2009, pp. 29–32.<br />
[3] A. W. Rivadeneira, D. M. Gruen, M. J. Muller, and D. R. Millen, “Getting our head in the clouds: toward evaluation studies of tagclouds,” in CHI ’07: Proceedings of the SIGCHI conference on Human factors in computing systems. New York, NY, USA: ACM, 2007, pp. 995–998.<br />
[4] J. Sinclair and M. Cardew-Hall, “The folksonomy tag cloud: when is it useful?” Journal of Information Science, vol. 34, p. 15, 2008. [Online]. Available: http://jis.sagepub.com/cgi/content/abstract/34/1/15<br />
[5] N. Neubauer and K. Obermayer, “Hyperincident connected components of tagging networks,” in HT ’09: Proceedings of the 20th ACM conference on Hypertext and hypermedia. New York, NY, USA: ACM, 2009, pp. 229–238.</p>
<br />Filed under: <a href='http://mstrohm.wordpress.com/category/uncategorized/'>Uncategorized</a>  <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gocomments/mstrohm.wordpress.com/463/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/comments/mstrohm.wordpress.com/463/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godelicious/mstrohm.wordpress.com/463/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/delicious/mstrohm.wordpress.com/463/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gofacebook/mstrohm.wordpress.com/463/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/facebook/mstrohm.wordpress.com/463/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gotwitter/mstrohm.wordpress.com/463/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/twitter/mstrohm.wordpress.com/463/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gostumble/mstrohm.wordpress.com/463/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/stumble/mstrohm.wordpress.com/463/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godigg/mstrohm.wordpress.com/463/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/digg/mstrohm.wordpress.com/463/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/goreddit/mstrohm.wordpress.com/463/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/reddit/mstrohm.wordpress.com/463/" /></a> <img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=mstrohm.wordpress.com&amp;blog=2808012&amp;post=463&amp;subd=mstrohm&amp;ref=&amp;feed=1" width="1" height="1" />]]></content:encoded>
			<wfw:commentRss>http://mstrohm.wordpress.com/2010/08/16/are-tag-clouds-useful-for-navigating-social-media/feed/</wfw:commentRss>
		<slash:comments>0</slash:comments>
	
		<media:content url="" medium="image">
			<media:title type="html">Markus</media:title>
		</media:content>

		<media:content url="http://mstrohm.files.wordpress.com/2010/08/tagcloud.jpg?w=300" medium="image">
			<media:title type="html">Are Tag Clouds Useful for Navigating Social Tagging Systems?</media:title>
		</media:content>
	</item>
		<item>
		<title>On taxonomies, folksonomies, and tweetonomies</title>
		<link>http://mstrohm.wordpress.com/2010/04/17/on-taxonomies-folksonomies-and-tweetonomies/</link>
		<comments>http://mstrohm.wordpress.com/2010/04/17/on-taxonomies-folksonomies-and-tweetonomies/#comments</comments>
		<pubDate>Sat, 17 Apr 2010 09:29:41 +0000</pubDate>
		<dc:creator>Markus Strohmaier</dc:creator>
				<category><![CDATA[research]]></category>
		<category><![CDATA[folksonomy]]></category>
		<category><![CDATA[knowledge]]></category>
		<category><![CDATA[knowledge acquisition]]></category>
		<category><![CDATA[knowledge capture]]></category>
		<category><![CDATA[semsearch2010]]></category>
		<category><![CDATA[social awareness streams]]></category>
		<category><![CDATA[social media]]></category>
		<category><![CDATA[taxonomy]]></category>
		<category><![CDATA[tweetonomies]]></category>
		<category><![CDATA[tweetonomy]]></category>
		<category><![CDATA[tweets]]></category>
		<category><![CDATA[twitter]]></category>
		<category><![CDATA[www2010]]></category>

		<guid isPermaLink="false">http://mstrohm.wordpress.com/?p=412</guid>
		<description><![CDATA[For centuries, taxonomies have been a tool for mankind to bring structure to the world. Taxonomies (wikipedia: &#8220;the practice and science of classification&#8221;) were developed in different fields of science, including &#8211; but not limited to &#8211; biology (e.g. taxonomies of animals) or library sciences (e.g. taxonomies of literature). Regardless of the particular domain of [...]<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=mstrohm.wordpress.com&amp;blog=2808012&amp;post=412&amp;subd=mstrohm&amp;ref=&amp;feed=1" width="1" height="1" />]]></description>
			<content:encoded><![CDATA[<div id="attachment_427" class="wp-caption alignleft" style="width: 112px"><a href="http://mstrohm.files.wordpress.com/2010/04/dessert-taxonomy1.jpg"><img class="size-thumbnail wp-image-427 " title="On taxonomies, folksonomies and tweetonomies" src="http://mstrohm.files.wordpress.com/2010/04/dessert-taxonomy1.jpg?w=102&#038;h=150" alt="" width="102" height="150" /></a><p class="wp-caption-text">Towards a Taxonomy of Meta-Desserts (by several_bees @flickr)</p></div>
<p>For centuries, <strong>taxonomies </strong>have been a tool for mankind to bring structure to the world. Taxonomies (<a href="http://en.wikipedia.org/wiki/Taxonomy">wikipedia</a>: <em>&#8220;the  practice and science of classification&#8221;</em>) were developed in different fields of science, including &#8211; but not limited to &#8211; biology (e.g. taxonomies of animals) or library sciences (e.g. <a href="http://en.wikipedia.org/wiki/Dewey_Decimal_Classification">taxonomies of literature</a>). Regardless of the particular domain of application, in most cases those taxonomies were developed by a selected few (e.g. librarians), and were used by many.</p>
<p>With the emergence of personal computers and file directories, the task of taxonomy development was brought to the masses. Suddenly everyone (i.e. every computer user) was in charge of developing, maintaining and transforming personal taxonomical structures in order to organize and (re-)find resources. While this development has led to a vast increase of personal taxonomies, it was only since <a href="http://www.delicious.com">del.icio.us</a> has popularized tagging as a new form of resource organization that users&#8217; personal taxonomies were exposed publicly. This has made it possible to aggregate a large number of personal taxonomies into collective taxonomic structures. The result of such aggregation has since then been refered to as <strong><a href="http://www.vanderwal.net/folksonomy.html">folksonomies</a></strong>, i.e. an emergent structure collectively produced by a large number of users in a bottom-up manner.</p>
<p>In social awareness streams (<a href="http://infolab.stanford.edu/~mor/research/naamanCSCW10.pdf">pdf</a>) such as Twitter of Facebook, users typically do not aim to classify or organize resources, but they engage in casual chatter and dialogue, ocassionally using syntax to coordinate communication (such as #<a href="http://factoryjoe.com/blog/2007/08/25/groups-for-twitter-or-a-proposal-for-twitter-tag-channels/">hashtags</a> or @replies). Taxonomic structures can be assumed to play a subordinate role for users of social awareness streams.</p>
<p>In a recent paper to be presented at the SemSearch Workshop at WWW2010 [<a href="#1">1</a>] however, we show that there exist latent conceptual structures &#8211; similar to taxonomies or folksonomies &#8211; in social awareness streams, and that we can acquire these structures through simple aggregation mechanisms.</p>
<blockquote><p><strong>Abstract: </strong><em>Although one might argue that little wisdom can be conveyed in messages of 140 characters or less, this paper sets out to explore whether the aggregation of messages in social awareness streams, such as Twitter, conveys meaningful information about a given domain. As a research community, we know little about the structural and semantic properties of such streams, and how they can be analyzed, characterized and used. This paper introduces a network-theoretic model of social awareness streams, a so-called &#8220;tweetonomy&#8221;, together with a set of stream-based measures that allow researchers to systematically define and compare different stream aggregations. We apply the model and measures to a dataset acquired from Twitter to study emerging semantics in selected streams. The network-theoretic model and the corresponding measures introduced in this paper are relevant for researchers interested in information retrieval and ontology learning from social  awareness streams. Our empirical findings demonstrate that different social awareness stream aggregations exhibit interesting differences, making them amenable for different applications </em>[<a href="#1">1</a>]<em>.</em></p></blockquote>
<p>In the paper, we introduce the notion of <strong>tweetonomies</strong>, and a corresponding tri-partite model of social awareness streams that extends the existing model of folksonomies by accomodating user-generated syntax (such as <a href="http://factoryjoe.com/blog/2009/11/08/new-microsyntax-for-twitter-three-pointers-and-the-slasher/">slashtags</a> and <a href="http://microsyntax.pbworks.com/">other emerging syntax</a>) and thereby integrating the communicative nature of such streams.</p>
<p>In the figure below, we have applied the network-theoretic model of tweetonomies to acquire a semantic network of hashtags that could be used for a range of different purposes, such as for navigating social awareness streams or for recommendation problems.</p>
<div id="attachment_424" class="wp-caption aligncenter" style="width: 481px"><a href="http://mstrohm.files.wordpress.com/2010/04/hashtags_plot.png"><img class="size-full wp-image-424" title="On taxonomies, folksonomies and tweetonomies" src="http://mstrohm.files.wordpress.com/2010/04/tweetonomy-preview.jpg?w=510" alt=""   /></a><p class="wp-caption-text">A tweetonomy of hashtags, aquired from Twitter (with the help of Jan Poeschko, click for full image 2.6 MB)</p></div>
<p>Our work shows that tweetonomies are a far more complex structure than &#8211; for example &#8211; taxonomies or folksonomies. One reason for that observation lies in the dynamic and user-generated nature of its <a href="http://microsyntax.pbworks.com/">syntax</a>, but also in the fact that tweetonomies accomodate a much richer language than the language used in social tagging systems (tweets vs tags).</p>
<p>The results of our work suggest that tweetonomies are a novel and promising concept, different from taxonomies and folksonomies where people engage in conscious acts of classification. Whether tweetonomies have the potential to bring order and structure to social awareness streams similar to the way folksonomies brought order to social tagging systems remains a question to be answered.</p>
<p><span style="color:#ff0000;">Update (May 5 2010):</span> An interesting question that was raised during the presentation of the paper at the WWW&#8217;2010 workshop was whether it would be justified to introduce Tweetonomies as a new concept. In other words, are the structures that we observe on twitter not just a different form of folksonomies? I&#8217;d argue for the necessity of a new concept for the following reasons: While taxonomies and folksonomies emerge when users structure <strong>resources</strong>, tweetonomies emerge when users structure <strong>conversation</strong>. Because conversations are inherently different than resources (e.g. they are dynamic, and involve multiple users) the structures that emerge from social awareness streams (tweetonomies) can be expected to be different from the structures that emerge from social bookmarking systems (folksonomies). Whether this is really the case however needs to be investigated in future work.</p>
<p>References:</p>
<p><a name="1"></a>[1] <a href="http://www.clauwa.info/">C. Wagner</a>, M. Strohmaier, <a href="http://kmi.tugraz.at/staff/markus/documents/2010_SemSearch2010_Tweetonomies.pdf">The Wisdom in Tweetonomies: Acquiring Latent Conceptual Structures from Social Awareness Streams</a>, Semantic Search 2010 Workshop (SemSearch2010), in conjunction with the 19th International World Wide Web Conference (WWW2010), Raleigh, NC, USA, April 26-30, ACM, 2010. (<a href="http://kmi.tugraz.at/staff/markus/documents/2010_SemSearch2010_Tweetonomies.pdf">pdf</a>)</p>
<br />Filed under: <a href='http://mstrohm.wordpress.com/category/research/'>research</a>  <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gocomments/mstrohm.wordpress.com/412/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/comments/mstrohm.wordpress.com/412/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godelicious/mstrohm.wordpress.com/412/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/delicious/mstrohm.wordpress.com/412/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gofacebook/mstrohm.wordpress.com/412/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/facebook/mstrohm.wordpress.com/412/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gotwitter/mstrohm.wordpress.com/412/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/twitter/mstrohm.wordpress.com/412/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gostumble/mstrohm.wordpress.com/412/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/stumble/mstrohm.wordpress.com/412/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godigg/mstrohm.wordpress.com/412/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/digg/mstrohm.wordpress.com/412/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/goreddit/mstrohm.wordpress.com/412/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/reddit/mstrohm.wordpress.com/412/" /></a> <img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=mstrohm.wordpress.com&amp;blog=2808012&amp;post=412&amp;subd=mstrohm&amp;ref=&amp;feed=1" width="1" height="1" />]]></content:encoded>
			<wfw:commentRss>http://mstrohm.wordpress.com/2010/04/17/on-taxonomies-folksonomies-and-tweetonomies/feed/</wfw:commentRss>
		<slash:comments>0</slash:comments>
	
		<media:content url="" medium="image">
			<media:title type="html">Markus</media:title>
		</media:content>

		<media:content url="http://mstrohm.files.wordpress.com/2010/04/dessert-taxonomy1.jpg?w=102" medium="image">
			<media:title type="html">On taxonomies, folksonomies and tweetonomies</media:title>
		</media:content>

		<media:content url="http://mstrohm.files.wordpress.com/2010/04/tweetonomy-preview.jpg" medium="image">
			<media:title type="html">On taxonomies, folksonomies and tweetonomies</media:title>
		</media:content>
	</item>
		<item>
		<title>Call for Papers: International Workshop on Modeling Social Media 2010 (MSM&#8217;10)</title>
		<link>http://mstrohm.wordpress.com/2010/03/15/cfp-international-workshop-on-modeling-social-media-2010-msm10/</link>
		<comments>http://mstrohm.wordpress.com/2010/03/15/cfp-international-workshop-on-modeling-social-media-2010-msm10/#comments</comments>
		<pubDate>Mon, 15 Mar 2010 09:26:31 +0000</pubDate>
		<dc:creator>Markus Strohmaier</dc:creator>
				<category><![CDATA[events]]></category>
		<category><![CDATA[Call for Papers]]></category>
		<category><![CDATA[CfP]]></category>
		<category><![CDATA[hypertext]]></category>
		<category><![CDATA[mining]]></category>
		<category><![CDATA[modeling]]></category>
		<category><![CDATA[motivation]]></category>
		<category><![CDATA[msm2010]]></category>
		<category><![CDATA[social]]></category>
		<category><![CDATA[social media]]></category>
		<category><![CDATA[twitter]]></category>
		<category><![CDATA[web-science]]></category>
		<category><![CDATA[workshop]]></category>

		<guid isPermaLink="false">http://mstrohm.wordpress.com/?p=400</guid>
		<description><![CDATA[I&#8217;d like to point you to a Call for Papers for a workshop I&#8217;m involved in organizing at Hypertext 2010 in Toronto this June. I&#8217;m really excited about the focus of this event, and I&#8217;m looking forward to lots of exciting discussions and presentations (check out the invited talks and panelists!). International Workshop on Modeling [...]<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=mstrohm.wordpress.com&amp;blog=2808012&amp;post=400&amp;subd=mstrohm&amp;ref=&amp;feed=1" width="1" height="1" />]]></description>
			<content:encoded><![CDATA[<p>I&#8217;d like to point you to a Call for Papers for a workshop I&#8217;m involved in organizing at <a href="http://www.ht2010.org/">Hypertext 2010</a> in Toronto this June. I&#8217;m really excited about the focus of this event, and I&#8217;m looking forward to lots of exciting discussions and presentations (check out the invited talks and panelists!).</p>
<p style="text-align:center;">International Workshop on <strong><br />
Modeling Social Media 2010 (MSM&#8217;10)</strong></p>
<p style="text-align:center;"><strong>Website: </strong><a href="http://kmi.tugraz.at/workshop/MSM10/">http://kmi.tugraz.at/workshop/MSM10/</a></p>
<p style="text-align:center;"><img class="aligncenter" title="International Workshop on Modeling Social Media 2010 (MSM'10)" src="http://kmi.tugraz.at/workshop/MSM10/candidate1.jpg" alt="" width="414" height="104" /></p>
<p style="text-align:center;">June 13, 2010, co-located with <a href="http://www.ht2010.org/">Hypertext  2010</a>,<br />
Toronto, Canada</p>
<p><strong>Important Dates:</strong></p>
<p>* Submission Deadline: <span style="color:#ff0000;">April 9, 2010</span><br />
* Notification of Acceptance: May 13, 2010<br />
* Final Papers Due: May 20, 2010<br />
* Workshop date: June 13, 2010, Toronto, Canada</p>
<p><strong><a name="organizers"></a>Workshop Organizers:</strong></p>
<ul>
<li><a href="http://research.nokia.com/people/alvin_chin">Alvin  Chin</a>, Nokia Research Center, Beijing, China, alvin.chin (at)  nokia.com</li>
<li><a href="http://www.is.informatik.uni-wuerzburg.de/staff/hotho/">Andreas  Hotho</a>, University of Wuerzburg, Germany, hotho (at)  informatik.uni-wuerzburg.de</li>
<li><a href="http://kmi.tugraz.at/staff/markus/">Markus  Strohmaier</a>, Graz University of Technology, Austria,  markus.strohmaier (at) tugraz.at</li>
</ul>
<p><strong><a name="organizers"></a>Format:</strong></p>
<p>The workshop will be opened by an invited talk given by <a href="http://www-users.cs.umn.edu/%7Eechi/">Ed Chi</a> (Palo Alto  Research Center). The talk will be followed by a number of peer-reviewed  research and position paper presentations and a discussion panel  including <a href="http://www.chass.utoronto.ca/%7Ewellman/">Barry  Wellman</a> (University of Toronto), <a href="http://people.ischool.berkeley.edu/%7Ehearst/">Marti Hearst</a> (University of California, Berkeley) and <a href="http://www-users.cs.umn.edu/%7Eechi/">Ed Chi</a> (Palo Alto  Research Center).</p>
<div><strong><a name="objectives"></a>Workshop&#8217;s Objectives and Goals:</strong></div>
<p>The goal of this workshop is to focus the attention of researchers on the increasingly important role of modeling social media. The workshop aims to attract and discuss a wide range of modeling perspectives (such as justificative, explanative, descriptive, formative, predictive, etc models) and approaches (statistical modeling, conceptual modeling, temporal modeling, etc). We want to bring together researchers and practitioners with diverse backgrounds interested in 1) exploring different perspectives and approaches to modeling complex social media phenomena and systems, 2) the different purposes and applications that models of social media can serve, 3) issues of integrating and validating social media models and 4) new modeling techniques for social media. The workshop aims to start a dialogue aiming to reflect upon and discuss these issues.</p>
<div><strong>Topics:</strong></div>
<p>Topics may include, but are not limited to:</p>
<p>+ new modeling techniques and approaches for social media<br />
+ models of propagation and influence in twitter, blogs and social tagging systems<br />
+ models of expertise and trust in twitter, wikis, newsgroups, question and answering systems<br />
+ modeling of social phenomena and emergent social behavior<br />
+ agent-based models of social media<br />
+ models of emergent social media properties<br />
+ models of user motivation, intent and goals in social media<br />
+ cooperation and collaboration models<br />
+ software-engineering and requirements models for social media<br />
+ adapting and adaptive hypertext models for social media<br />
+ modeling social media users and their motivations and goals<br />
+ architectural and framework models<br />
+ user modeling and behavioural models<br />
+ modeling the evolution and dynamics of social media</p>
<div><strong><a name="committee"></a>Preliminary Program Committee  (confirmed):</strong></div>
<div>
<ul>
<li> Ansgar Scherp, Koblenz University, Germany<strong> </strong></li>
<li> Roelof van Zwol, Yahoo! Research Barcelona, Spain<strong></strong></li>
<li> Marti Hearst, UC Berkeley, USA</li>
<li> Ed Chi, PARC, USA</li>
<li> Peter Pirolli, PARC, USA<strong></strong></li>
<li>Steffen Staab, Koblenz University, Germany</li>
<li> Barry Wellman, University of Toronto, Canada<strong></strong></li>
<li> Daniel Gayo-Avello, University of Oviedo, Spain<strong></strong></li>
<li> Jordi Cabot, INRIA, France<strong></strong></li>
<li> Pranam Kolari, Yahoo! Research, USA<strong></strong></li>
<li> Tad Hogg, Institute for Molecular Manufacturing, USA<strong></strong></li>
<li> Wai-Tat Fu, University of Illinois at Urbana-Champaign, USA<strong></strong></li>
<li> Thomas Kannampallil, University of Texas, USA</li>
<li> Justin Zhan, Carnegie Mellon University, USA<strong></strong></li>
<li> Marc Smith, ConnectedAction, USA</li>
<li>Mark  Chignell, University of Toronto, Canada</li>
</ul>
<p><strong>Website: </strong><a href="http://kmi.tugraz.at/workshop/MSM10/">http://kmi.tugraz.at/workshop/MSM10/</a></div>
<br />Filed under: <a href='http://mstrohm.wordpress.com/category/events/'>events</a>  <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gocomments/mstrohm.wordpress.com/400/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/comments/mstrohm.wordpress.com/400/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godelicious/mstrohm.wordpress.com/400/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/delicious/mstrohm.wordpress.com/400/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gofacebook/mstrohm.wordpress.com/400/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/facebook/mstrohm.wordpress.com/400/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gotwitter/mstrohm.wordpress.com/400/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/twitter/mstrohm.wordpress.com/400/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gostumble/mstrohm.wordpress.com/400/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/stumble/mstrohm.wordpress.com/400/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godigg/mstrohm.wordpress.com/400/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/digg/mstrohm.wordpress.com/400/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/goreddit/mstrohm.wordpress.com/400/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/reddit/mstrohm.wordpress.com/400/" /></a> <img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=mstrohm.wordpress.com&amp;blog=2808012&amp;post=400&amp;subd=mstrohm&amp;ref=&amp;feed=1" width="1" height="1" />]]></content:encoded>
			<wfw:commentRss>http://mstrohm.wordpress.com/2010/03/15/cfp-international-workshop-on-modeling-social-media-2010-msm10/feed/</wfw:commentRss>
		<slash:comments>0</slash:comments>
	
		<media:content url="" medium="image">
			<media:title type="html">Markus</media:title>
		</media:content>

		<media:content url="http://kmi.tugraz.at/workshop/MSM10/candidate1.jpg" medium="image">
			<media:title type="html">International Workshop on Modeling Social Media 2010 (MSM&#039;10)</media:title>
		</media:content>
	</item>
		<item>
		<title>WWW&#8217;2010 &#8211; Stop Thinking, Start Tagging: Tag Semantics Emerge From Collaborative Verbosity</title>
		<link>http://mstrohm.wordpress.com/2010/02/12/www2010-stop-thinking-start-tagging-tag-semantics-emerge-from-collaborative-verbosity/</link>
		<comments>http://mstrohm.wordpress.com/2010/02/12/www2010-stop-thinking-start-tagging-tag-semantics-emerge-from-collaborative-verbosity/#comments</comments>
		<pubDate>Fri, 12 Feb 2010 13:28:04 +0000</pubDate>
		<dc:creator>Markus Strohmaier</dc:creator>
				<category><![CDATA[Uncategorized]]></category>
		<category><![CDATA[categorizer]]></category>
		<category><![CDATA[delicious]]></category>
		<category><![CDATA[describer]]></category>
		<category><![CDATA[emergent semantics]]></category>
		<category><![CDATA[intent]]></category>
		<category><![CDATA[tag semantics]]></category>
		<category><![CDATA[tagging]]></category>
		<category><![CDATA[tagging motivation]]></category>
		<category><![CDATA[tagging pragmatics]]></category>
		<category><![CDATA[www2010]]></category>

		<guid isPermaLink="false">http://mstrohm.wordpress.com/?p=386</guid>
		<description><![CDATA[I want to share the abstract of our upcoming paper at WWW&#8217;2010 (here is a link to the full paper). In case you are interested in our research and going to WWW in Raleigh this year as well, I&#8217;d be happy if you&#8217;d get in touch. C. Körner, D. Benz, A. Hotho, M. Strohmaier, G. [...]<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=mstrohm.wordpress.com&amp;blog=2808012&amp;post=386&amp;subd=mstrohm&amp;ref=&amp;feed=1" width="1" height="1" />]]></description>
			<content:encoded><![CDATA[<p>I want to share the abstract of our upcoming paper at WWW&#8217;2010 (here is a link to the <a href="http://kmi.tugraz.at/staff/markus/documents/2010_WWW2010_Tagging.pdf">full paper</a>). In case you are interested in our research and going to WWW in Raleigh this year as well, I&#8217;d be happy if you&#8217;d get in touch.</p>
<p>C. Körner, D. Benz, A. Hotho, M. Strohmaier, G. Stumme, <strong>Stop Thinking, Start Tagging: Tag Semantics Emerge From Collaborative Verbosity</strong>, 19th International World Wide Web Conference (WWW2010), Raleigh, NC, USA, April 26-30, ACM, 2010.</p>
<blockquote><p><strong>Abstract: </strong>Recent research provides evidence for the presence of emergent semantics in collaborative tagging systems. While several methods have been proposed, little is known about the factors that influence the evolution of semantic structures in these systems. A natural hypothesis is that the quality of the emergent semantics depends on the pragmatics of tagging: Users with certain usage patterns might contribute more to the resulting semantics than others. In this work, we propose several measures which enable a pragmatic differentiation of taggers by their degree of contribution to emerging semantic structures. We distinguish between categorizers, who typically use a small set of tags as a replacement for hierarchical classification schemes, and describers, who are annotating resources with a wealth of freely associated, descriptive keywords. To study our hypothesis, we apply semantic similarity measures to 64 different partitions of a real-world and large-scale folksonomy containing different ratios of categorizers and describers. Our results not only show that ‘verbose’ taggers are most useful for the emergence  of tag semantics, but also that a subset containing only 40% of the most ‘verbose’ taggers can produce results that match and even outperform the semantic precision obtained from the whole dataset. Moreover, the results suggest that there exists a causal link between the pragmatics of tagging and resulting emergent semantics. This work is relevant for designers and analysts of tagging systems interested (i) in fostering the semantic development of their platforms, (ii) in identifying users introducing “semantic noise”, and (iii) in learning ontologies.</p></blockquote>
<p>More details can be found in the <a href="http://kmi.tugraz.at/staff/markus/documents/2010_WWW2010_Tagging.pdf">full paper</a>.</p>
<p>This work is funded in part by the Know-Center and the FWF Research Grant TransAgere. It is the result of a collaboration with the <a href="http://www.kde.cs.uni-kassel.de/">KDE group</a> at University of Kassel and the  <a href="http://www.is.informatik.uni-wuerzburg.de/staff/hotho/">University of Würzburg</a>. You might  also want to have a look at a <a href="http://bibsonomy.blogspot.com/2010/02/stop-thinking-start-tagging-tag.html">related blog post on the bibsonomy blog</a>.</p>
<p>Some background about the distinction between categorizers and describers can be found in a related paper:</p>
<p><em>M. Strohmaier, C. Koerner, R. Kern,  <strong>Why do Users Tag? Detecting  Users&#8217; Motivation  for Tagging in Social Tagging Systems</strong>, 4th  International  AAAI Conference on Weblogs and Social Media (ICWSM2010),  Washington,  DC, USA, May 23-26, 2010. </em>(<a href="http://kmi.tugraz.at/staff/markus/documents/2010_ICWSM2010_Detecting_Tagging_Motivation.pdf">Download  pdf</a>)</p>
<br />Filed under: <a href='http://mstrohm.wordpress.com/category/uncategorized/'>Uncategorized</a>  <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gocomments/mstrohm.wordpress.com/386/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/comments/mstrohm.wordpress.com/386/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godelicious/mstrohm.wordpress.com/386/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/delicious/mstrohm.wordpress.com/386/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gofacebook/mstrohm.wordpress.com/386/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/facebook/mstrohm.wordpress.com/386/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gotwitter/mstrohm.wordpress.com/386/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/twitter/mstrohm.wordpress.com/386/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gostumble/mstrohm.wordpress.com/386/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/stumble/mstrohm.wordpress.com/386/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godigg/mstrohm.wordpress.com/386/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/digg/mstrohm.wordpress.com/386/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/goreddit/mstrohm.wordpress.com/386/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/reddit/mstrohm.wordpress.com/386/" /></a> <img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=mstrohm.wordpress.com&amp;blog=2808012&amp;post=386&amp;subd=mstrohm&amp;ref=&amp;feed=1" width="1" height="1" />]]></content:encoded>
			<wfw:commentRss>http://mstrohm.wordpress.com/2010/02/12/www2010-stop-thinking-start-tagging-tag-semantics-emerge-from-collaborative-verbosity/feed/</wfw:commentRss>
		<slash:comments>0</slash:comments>
	
		<media:content url="" medium="image">
			<media:title type="html">Markus</media:title>
		</media:content>
	</item>
		<item>
		<title>Measuring Earthquakes on Twitter: The Twicalli Scale</title>
		<link>http://mstrohm.wordpress.com/2010/01/15/measuring-earthquakes-on-twitter-the-twicalli-scale/</link>
		<comments>http://mstrohm.wordpress.com/2010/01/15/measuring-earthquakes-on-twitter-the-twicalli-scale/#comments</comments>
		<pubDate>Fri, 15 Jan 2010 16:59:59 +0000</pubDate>
		<dc:creator>Markus Strohmaier</dc:creator>
				<category><![CDATA[Uncategorized]]></category>
		<category><![CDATA[california]]></category>
		<category><![CDATA[data mining]]></category>
		<category><![CDATA[earthquake]]></category>
		<category><![CDATA[earthquakes]]></category>
		<category><![CDATA[haiti]]></category>
		<category><![CDATA[social media]]></category>
		<category><![CDATA[twitter]]></category>

		<guid isPermaLink="false">http://mstrohm.wordpress.com/?p=350</guid>
		<description><![CDATA[I got interested in the signal that Twitter received from the two last earthquakes happening in California and Haiti. It has been recently suggested that Twitter can play a role in assessing the magnitude of an earthquake, by studying the stream of tweets that contain a reference to the event, such as the stream of [...]<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=mstrohm.wordpress.com&amp;blog=2808012&amp;post=350&amp;subd=mstrohm&amp;ref=&amp;feed=1" width="1" height="1" />]]></description>
			<content:encoded><![CDATA[<p>I got interested in the signal that Twitter received from the two last earthquakes happening in <a href="http://www.reuters.com/article/idUSN0911980620100110">California</a> and <a href="http://www.alertnet.org/thenews/fromthefield/222031/126354623931.htm">Haiti</a>. It has been recently suggested that Twitter can play a role in assessing the magnitude of an earthquake, by studying the stream of tweets that contain a reference to the event, such as the stream of messages related to <a href="http://search.twitter.com/search?q=%23earthquake">#earthquake</a>, including messages like <a href="http://twitter.com/joshperrington/status/7688627649">this</a>. The term &#8220;<strong>Twichter Scale</strong>&#8221; has been used in this context to discuss the relation between Twitter and external events such as earthquakes.</p>
<p>Different people have expressed different ideas about a Twichter Scale, for example:</p>
<blockquote><p><span class="status-body"> <span class="entry-content">Twichter Scale (n): the fraction of Twitter traffic caused by an earthquake. Unused on the east coast. (<a href="http://twitter.com/ian_soboroff/status/7488111821">@ian_soboroff</a>)</span></span></p></blockquote>
<p>While this definition does not necessarily imply that the Twichter scale indicates the magnitude of earthquakes, it is interesting to ask whether Twitter data can be used for that purpose.</p>
<p><a href="http://mstrohm.files.wordpress.com/2010/01/twitter-streams-quake.png"><img class="size-full wp-image-351" title="Measuring Earth Quakes on Twitter" src="http://mstrohm.files.wordpress.com/2010/01/twitter-streams-quake.png?w=510&#038;h=257" alt="" width="510" height="257" /></a></p>
<blockquote>
<div class="mceTemp mceIEcenter">
<dl class="wp-caption aligncenter">
<dd class="wp-caption-dd">Impact of two earthquakes on different Twitter hashtag streams: #earthquake, #earthquakes and #quake between Jan 9 and Jan 15</dd>
</dl>
</div>
</blockquote>
<p>When we look at the data, we can clearly identify both earthquakes represented as spikes in the data. Both earthquakes were comparable in terms of Magnitude (6,5 vs. 7.0 on the Richter Scale). And in fact, both events produced a comparable amplitude for the <a href="http://search.twitter.com/search?q=%23earthquake">#earthquake</a> hashtag stream. On the surface, this might be a confirmation of the idea of a <strong>Twichter Scale</strong>, based on the <strong>Richter Scale</strong>, which is a scale measuring the magnitude of an earthquake. The Richter scale produces the same value for a given earthquake, no matter where you are.</p>
<p>However, there is another, less scientific measure to characterize earthquakes &#8211; the so-called <strong>Mercalli scale</strong> &#8211; which is a measure of an earthquake&#8217;s effect on people and structures.</p>
<p>Which yields to the interesting question, whether Twitter streams can better serve as an indicator of <em>strength </em>(Richter) or <em>impact </em>(Mercalli) of an earthquake?</p>
<p>As we can see in the figure, the amplitude produced on Twitter is approximately equal for both events (almost 400 messages per hour). My suspicion however is, that this is not because Twitter accurately captures the strengths of earthquakes, but because the Jan 9 earthquake was closer to California, where more people (more Twitter users) are willing to share their experiences. So it seems that this produced an amplitude of similar extent, although <em><span style="color:#000000;">the impact of the Jan 9 earthquake in California on structures and people was much weaker than the impact of the Jan 12 earthquake in Haiti</span></em>.</p>
<p>So how can we identify the difference of an earthquake in terms of its impact on people and structures?</p>
<p>When we look at the diagram above, we can see a clear difference after the initial spike: While the Californian earthquake did not cause many follow-up tweets, the aftermath of the Haiti earthquake is clearly visible.</p>
<p>What does that say about Twitter as a signal for earthquakes?</p>
<blockquote>
<ol>
<li>The <strong>amplitude of the signal on Twitter </strong>is very likely biased by the density of Twitter users in a given region, and thereby <strong>can neither give reliable information about the magnitude nor the impact of an earthquake</strong>. This suggests that Twitter can not act as a reliable sensor to detect the magnitude of an earthquake in a &#8220;Richter Scale&#8221; sense.</li>
<li>However, the <strong>&#8220;aftermath&#8221; of a spike on twitter</strong> (the <a href="http://en.wikipedia.org/wiki/Integral">integral</a>) seems to be a good indication of an earthquake&#8217;s <strong>impact on people and structures </strong>- in a &#8220;Mercalli Scale&#8221; sense. Long after the initial spike, the Haiti earthquake is still topic of conversations on Twitter (those are likely related to  fundraising efforts and other related aid activities). Indepentent of the density of Twitter users in Haiti (which is probably low), the aftermath can clearly be identified.</li>
</ol>
</blockquote>
<p><strong>The Twicalli Scale:</strong></p>
<p>This suggests that Twitter as a sensor for the magnitude of earthquakes (in a Richter Scale sense) does not seem very useful. Twitter is more indicative of earthquakes in a &#8220;Twicalli scale&#8221; sense:</p>
<p>Using the <strong>aftermath </strong>(not the amplitude) <strong>of twitter stream data</strong>, the <strong>impact</strong> (not the magnitude) of <strong>earthquakes becomes visible on Twitter</strong>.</p>
<p><em><span style="color:#ff0000;">Update: </span></em><span style="color:#ff0000;"><em>Here are links to further resources and the datasets this analysis is based on:</em></span></p>
<ul>
<li><a href="http://kmi.tugraz.at/staff/markus/datasets/twitter/">Wired article &#8220;</a><a href="http://www.wired.com/wiredscience/2009/12/twitter-earthquake-alerts/">Freaked-Out Tweets After Earthquakes Help Scientists</a>&#8220;</li>
<li><a href="http://epic.cs.colorado.edu/helping_haiti_tweak_the_twe.html">An effort to introduce disaster-specific Twitter Syntax</a> (by the University of Colorado) to coordinate relieve activities</li>
<li><span class="status-body"><span class="entry-content">An interesting paper at <a href="http://www2010.org">WWW2010</a>: &#8220;<a href="http://ymatsuo.com/papers/www2010.pdf">Earthquake Shakes Twitter Users: Real-time Event Detection by Social Sensors (PDF)</a>&#8220;<br />
</span></span></li>
<li>A blog post by Gene Golovchinsky on <a href="http://palblog.fxpal.com/?p=2749">Mechanical Turk, Twitter Syntax and disaster coordination</a></li>
<li><a href="http://kmi.tugraz.at/staff/markus/datasets/twitter/">Archives</a> for hashtagstreams #earthquake, #earthquakes, #quake</li>
</ul>
<p><em><span style="color:#ff0000;">Update II (Aug 27 2010): </span></em><span style="color:#ff0000;"><em>The Twicalli scale was mentioned in a recent paper on the importance of trust in social awareness streams such as Twitter (page 8, left column)</em></span></p>
<p>Marcelo Mendoza, Barbara Poblete and Carlos Castillo, <strong>Twitter Under Crisis: Can we trust what we RT?</strong>, Workshop on Social Media Analytics, In conjunction with the International Conference on Knowledge Discovery &amp; Data Mining (KDD 2010), <a href="http://snap.stanford.edu/soma2010/papers/soma2010_11.pdf">PDF download</a> (see page 8, left column)</p>
<p><em><span style="color:#ff0000;">Update III (Oct 11 2011): Now there&#8217;s also a WWW2011 paper mentioning the Twicalli Scale (page 2, top of right column)</span></em></p>
<p>Carlos Castillo, Marcelo Mendoza, and Barbara Poblete. 2011. <strong>Information credibility on twitter</strong>. In <em>Proceedings of the 20th international conference on World wide web</em> (WWW &#8217;11). ACM, New York, NY, USA, 675-684.</p>
<blockquote>
<div id="_mcePaste" style="overflow:hidden;position:absolute;left:-10000px;top:0;width:1px;height:1px;">http://twitter.com/ian_soboroff/status/7488111821</div>
</blockquote>
<br />Posted in Uncategorized  <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gocomments/mstrohm.wordpress.com/350/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/comments/mstrohm.wordpress.com/350/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godelicious/mstrohm.wordpress.com/350/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/delicious/mstrohm.wordpress.com/350/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gofacebook/mstrohm.wordpress.com/350/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/facebook/mstrohm.wordpress.com/350/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gotwitter/mstrohm.wordpress.com/350/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/twitter/mstrohm.wordpress.com/350/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gostumble/mstrohm.wordpress.com/350/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/stumble/mstrohm.wordpress.com/350/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godigg/mstrohm.wordpress.com/350/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/digg/mstrohm.wordpress.com/350/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/goreddit/mstrohm.wordpress.com/350/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/reddit/mstrohm.wordpress.com/350/" /></a> <img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=mstrohm.wordpress.com&amp;blog=2808012&amp;post=350&amp;subd=mstrohm&amp;ref=&amp;feed=1" width="1" height="1" />]]></content:encoded>
			<wfw:commentRss>http://mstrohm.wordpress.com/2010/01/15/measuring-earthquakes-on-twitter-the-twicalli-scale/feed/</wfw:commentRss>
		<slash:comments>4</slash:comments>
	
		<media:content url="" medium="image">
			<media:title type="html">Markus</media:title>
		</media:content>

		<media:content url="http://mstrohm.files.wordpress.com/2010/01/twitter-streams-quake.png" medium="image">
			<media:title type="html">Measuring Earth Quakes on Twitter</media:title>
		</media:content>
	</item>
		<item>
		<title>WSDM 2010 List of Accepted Papers</title>
		<link>http://mstrohm.wordpress.com/2009/12/26/wsdm-2010-list-of-accepted-papers/</link>
		<comments>http://mstrohm.wordpress.com/2009/12/26/wsdm-2010-list-of-accepted-papers/#comments</comments>
		<pubDate>Sat, 26 Dec 2009 16:26:14 +0000</pubDate>
		<dc:creator>Markus Strohmaier</dc:creator>
				<category><![CDATA[events]]></category>

		<guid isPermaLink="false">http://mstrohm.wordpress.com/?p=344</guid>
		<description><![CDATA[The list of accepted papers for WSDM 2010 is available now. Lot&#8217;s of exciting papers, I&#8217;m particularly interested in the ones related to tagging, microblogging, search intent and user goals. Here&#8217;s an excerpt of my reading list (including links to pdf-versions whenever they were available): Query Reformulation Using Anchor Text (pdf) Van Dang and Bruce [...]<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=mstrohm.wordpress.com&amp;blog=2808012&amp;post=344&amp;subd=mstrohm&amp;ref=&amp;feed=1" width="1" height="1" />]]></description>
			<content:encoded><![CDATA[<p>The <a href="http://www.wsdm-conference.org/2010/accepted-papers.html">list of accepted papers for WSDM 2010</a> is available now. Lot&#8217;s of exciting papers, I&#8217;m particularly interested in the ones related to tagging, microblogging, search intent and user goals. Here&#8217;s an excerpt of my reading list (including links to pdf-versions whenever they were available):</p>
<div>
<ul>
<li>
<div><strong>Query Reformulation Using Anchor Text (<a href="http://ciir-publications.cs.umass.edu/getpdf.php?id=900">pdf</a>)<br />
</strong></div>
<div><em>Van Dang and Bruce Croft</em></div>
</li>
<li>
<div><strong>Tagging Human Knowledge (<a href="http://ilpubs.stanford.edu:8090/878/">technical report</a>)<br />
</strong></div>
<div><em>Paul Heymann, Andreas Paepcke and Hector Garcia-Molina</em></div>
</li>
<li>
<div><strong>Ranking Mechanisms in Twitter-Like Forums (<a href="http://www.cc.gatech.edu/~atish/papers/wsdm357-dassarma.pdf">pdf</a>)<br />
</strong></div>
<div><em>Anish Das Sarma, Atish Das Sarma, Sreenivas Gollapudi and rina panigrahy</em></div>
</li>
<li>
<div><strong>Large Scale Query Log Analysis of Re-Finding (<a href="http://people.csail.mit.edu/teevan/work/publications/papers/wsdm10.pdf">pdf</a>)<br />
</strong></div>
<div><em>Sarah Tyler and Jaime Teevan</em></div>
</li>
<li>
<div><strong>TwitterRank: Finding Topic-sensitive Influential Twitterers (<a href="http://www.mysmu.edu/staff/jsweng/papers/TwitterRank_WSDM.pdf">pdf</a>)<br />
</strong></div>
<div><em>Jianshu Weng, Ee-peng Lim, Jing Jiang and Qi He</em></div>
</li>
<li>
<div><strong>I tag, You tag: Translating tags for advanced user models (<a href="http://vizzdom.com/publications/2010_WSDM_RW_tagtranslation.pdf">pdf</a>)<br />
</strong></div>
<div><em>Robert Wetzker, Carsten Zimmermann and Christian Bauckhage</em></div>
</li>
<li>
<div><strong>Folks in folksonomies: Social link prediction from shared metadata (<a href="http://www.cpt.univ-mrs.fr/~barrat/wsdm141-schifanella.pdf">pdf</a>)<br />
</strong></div>
<div><em>Rossano Schifanella, Alain Barrat, Ciro Cattuto, Benjamin Markines and Filippo Menczer</em></div>
</li>
</ul>
</div>
<p><!-- C.2 SUBCONTENT --></p>
<div><!-- SUBCONTENT CELL --></div>
<br />Posted in events  <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gocomments/mstrohm.wordpress.com/344/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/comments/mstrohm.wordpress.com/344/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godelicious/mstrohm.wordpress.com/344/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/delicious/mstrohm.wordpress.com/344/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gofacebook/mstrohm.wordpress.com/344/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/facebook/mstrohm.wordpress.com/344/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gotwitter/mstrohm.wordpress.com/344/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/twitter/mstrohm.wordpress.com/344/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gostumble/mstrohm.wordpress.com/344/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/stumble/mstrohm.wordpress.com/344/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godigg/mstrohm.wordpress.com/344/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/digg/mstrohm.wordpress.com/344/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/goreddit/mstrohm.wordpress.com/344/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/reddit/mstrohm.wordpress.com/344/" /></a> <img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=mstrohm.wordpress.com&amp;blog=2808012&amp;post=344&amp;subd=mstrohm&amp;ref=&amp;feed=1" width="1" height="1" />]]></content:encoded>
			<wfw:commentRss>http://mstrohm.wordpress.com/2009/12/26/wsdm-2010-list-of-accepted-papers/feed/</wfw:commentRss>
		<slash:comments>0</slash:comments>
	
		<media:content url="" medium="image">
			<media:title type="html">Markus</media:title>
		</media:content>
	</item>
		<item>
		<title>Open Data for Cities: Enabling Citizens to Have the Apps They Want/Need</title>
		<link>http://mstrohm.wordpress.com/2009/10/08/open-data-for-cities/</link>
		<comments>http://mstrohm.wordpress.com/2009/10/08/open-data-for-cities/#comments</comments>
		<pubDate>Thu, 08 Oct 2009 13:59:09 +0000</pubDate>
		<dc:creator>Markus Strohmaier</dc:creator>
				<category><![CDATA[Uncategorized]]></category>

		<guid isPermaLink="false">http://mstrohm.wordpress.com/?p=332</guid>
		<description><![CDATA[During my recent resarch visit to PARC / the SF Bay Area, I came across a quite impressive iniative by the San Francisco Municipal Government aimed at opening up city data. While I was aware of Obama&#8217;s data.gov initiative on a federal level, opening up municipal data seems to be interesting because in many cases [...]<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=mstrohm.wordpress.com&amp;blog=2808012&amp;post=332&amp;subd=mstrohm&amp;ref=&amp;feed=1" width="1" height="1" />]]></description>
			<content:encoded><![CDATA[<p>During my recent resarch visit to <a href="http://www.parc.com/">PARC </a>/ the SF Bay Area, I came across a quite impressive iniative by the <strong>San Francisco </strong>Municipal Government aimed at opening up city data.</p>
<p>While I was aware of Obama&#8217;s <a href="http://www.data.gov/">data.gov</a> initiative on a federal level, opening up municipal data seems to be interesting because in many cases it is closer to people everday&#8217;s concerns, such as finding a parking lot or avoiding areas with high levels of crime.</p>
<p><a href="http://datasf.org/">http://datasf.org</a> is a website related to the San Francisco iniative, aiming to create transparency about the datasets made available by the city so far, such as the <a href="http://www.datasf.org/story.php?title=disabled-parking-blue-zones-">Disabled Parking Blue Zones dataset</a> (<a href="http://gispub02.sfgov.org/website/sfshare/catalog/dpt_bluezones.zip">.zip download</a>). The general idea is to expose municipal data to the public, in order to <em>enable the public to come up with innovations they feel are useful and/or important</em>. Examples of such innovations <a href="http://datasf.org/showcase/">can be found in a showcase</a>, including <a href="http://www.cleanscores.com/">an app for public health scores of SF restaurants</a> or <a href="http://www.mommaps.com/">an iphone application for finding kid-friendly locations in the city</a>.</p>
<p><img class="aligncenter" title="Mom Maps" src="http://datasf.org/showcase/wp-content/uploads/2009/09/sized_mommaps.jpg" alt="" width="240" height="360" /></p>
<p>Brilliant! What is also remarkable about these applications is that these innovations came to the city of San Francisco to no costs other than the costs related to publishing the data. Application development was done by developers who cared for a problem or companies who spotted a business opportunity.</p>
<p>In addition, publishing this data <em>shifts &#8211; to some extent &#8211; responsibility from cities to citizens</em>. If an application does not exist, people can certainly demand it to be provided &#8211; but more importantly &#8211; they can decide to develop it themselves, or organize in a way to get the applications they want developed indepedent of municipal approval.</p>
<p>After some further research, I was excited to see that the city of <strong>Toronto </strong>has a similar initiative, <a href="http://www.toronto.ca/open">http://www.toronto.ca/open</a>. Toronto major David Miller announced it at Mash09 (<a href="http://www.livestream.com/rabbletv/ondemand/flv_3502858424159777971?referrer=mogulus&amp;initthumburl=http://mogulus-user-files.s3.amazonaws.com/chv2rabbletv/2009/04/09/3502858424159777971_690.jpg&amp;playeraspectwidth=4&amp;playeraspectheight=3">watch the video here</a>, the interesting stuff starts at ~12:40).</p>
<p>From a transcript of his speech (<a href="http://visiblegovernment.ca/blog/2009/04/13/toronto-announces-open-data-plan-at-mesh09/">excerpts</a>), David Miller brings the vision of such initiatives nicely to the point:</p>
<blockquote><p><em>I am very pleased to announce today at Mesh09 the development of http://toronto.ca/open, which will be a catalogue of city generated data.  The data will be provided in standardized formats, will be machine readable, and will be updated regularly.  This will be launched in the fall of 2009 with an initial series of data sets, including static data like schedules, and some feeds updated in real time.</em></p>
<p><em>The benefits to the city of Toronto are extremely significant.  Individuals will find new ways to apply this data, improve city services, and expand their reach.  By sharing our information, the public can help us to improve services and create a more liveable city.  And as an open government, sharing data increases our transparency and accountability.</em></p></blockquote>
<p>In his speech, Major Millor also challenged the audience to develop apps that would help the government spot deficiencies and improvement potentials based on the published data (e.g. which contractor fixes reported road damage fastest/sustainably/etc?). Citizens (or better: &#8220;developers&#8221;) can come up with new ways of tapping into the data to develop new and innovative applications that provide unique services to municipal communities.</p>
<p>In <strong>Graz</strong> (<a href="http://en.wikipedia.org/wiki/Graz">Wikipedia</a>), I am currently teaching &#8211; among other courses &#8211; a <a href="http://kmi.tugraz.at/staff/markus/courses/SS2009/707.000_web-science/">course on Web Science</a> at Graz University of Technology,  with more than 100 students per semester. I can see a huge opportunity to combine latest web algorithms, and hands-on experiences on the web with the creative potential of students in order to come up with a vast number of new and innovative applications that could have an exciting impact to the city.</p>
<p>My results of a quick review on related efforts in Graz however have been somewhat disappointing. The only resource I found was the <a href="http://gis.graz.at/cms/ziel/1060687/DE/">GeoDataServer Graz</a> (if you are aware of other resources please post them as a comment!), which provides web interfaces to mostly static, geographic information, such as &#8220;rivers in Graz&#8221; or a &#8220;3D model of Graz&#8221; &#8211; which are fine and exciting examples. But for open data, these initiatives would need to be expanded significantly, to include up-to-date data feeds, APIs, common data representation formats and &#8211; most importantly &#8211; a grande strategy that provides a common vision of how the city wants to go about governing its data. I think this will eventually take place. In any case, I&#8217;m looking forward to getting students excited to participate and contribute to such initiatives, as these iniatives can probably serve as an excellent vehicle to let students have an impact, and at the same time teach them about the importance of service and responsibility in societies.<em> </em></p>
<p style="text-align:left;">This development also nicely ties in with some of my research interests on <em>people&#8217;s motivations on the web</em>: Enabling people to develop and have access to applications <em>they want </em>seems to be a tremendous shortcut to a more goal-oriented, useful, and ultimately more effective web.<em> </em>And with the advent of <a href="http://www.cs.uml.edu/~hgoodell/EndUser/">end user programming</a> and tools such as <a href="http://pipes.yahoo.com/">Yahoo Pipes</a>, there is not even a requirement for users to have lots of programming skills anymore to come up with useful applications or mashups.<em><img class="aligncenter size-full wp-image-206" title="Open Data for Cities: Enabling Citizens to Have the Apps They Want" src="http://mstrohm.files.wordpress.com/2009/04/1x1.png?w=510" alt="Motivations for Tagging: Categorization vs. Description"   /><img class="aligncenter size-full wp-image-206" title="Open Data for Cities: Enabling Citizens to Have the Apps They Want" src="http://mstrohm.files.wordpress.com/2009/04/1x1.png?w=510" alt="Open Data for Cities: Enabling Citizens to Have the Apps They Want"   /><br />
</em></p>
<br />Posted in Uncategorized  <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gocomments/mstrohm.wordpress.com/332/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/comments/mstrohm.wordpress.com/332/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godelicious/mstrohm.wordpress.com/332/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/delicious/mstrohm.wordpress.com/332/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gofacebook/mstrohm.wordpress.com/332/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/facebook/mstrohm.wordpress.com/332/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gotwitter/mstrohm.wordpress.com/332/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/twitter/mstrohm.wordpress.com/332/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gostumble/mstrohm.wordpress.com/332/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/stumble/mstrohm.wordpress.com/332/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godigg/mstrohm.wordpress.com/332/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/digg/mstrohm.wordpress.com/332/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/goreddit/mstrohm.wordpress.com/332/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/reddit/mstrohm.wordpress.com/332/" /></a> <img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=mstrohm.wordpress.com&amp;blog=2808012&amp;post=332&amp;subd=mstrohm&amp;ref=&amp;feed=1" width="1" height="1" />]]></content:encoded>
			<wfw:commentRss>http://mstrohm.wordpress.com/2009/10/08/open-data-for-cities/feed/</wfw:commentRss>
		<slash:comments>0</slash:comments>
	
		<media:content url="" medium="image">
			<media:title type="html">Markus</media:title>
		</media:content>

		<media:content url="http://datasf.org/showcase/wp-content/uploads/2009/09/sized_mommaps.jpg" medium="image">
			<media:title type="html">Mom Maps</media:title>
		</media:content>

		<media:content url="http://mstrohm.files.wordpress.com/2009/04/1x1.png" medium="image">
			<media:title type="html">Open Data for Cities: Enabling Citizens to Have the Apps They Want</media:title>
		</media:content>

		<media:content url="http://mstrohm.files.wordpress.com/2009/04/1x1.png" medium="image">
			<media:title type="html">Open Data for Cities: Enabling Citizens to Have the Apps They Want</media:title>
		</media:content>
	</item>
		<item>
		<title>Notes on the Relationship between Search and Tagging</title>
		<link>http://mstrohm.wordpress.com/2009/09/13/notes-on-the-relation-between-search-and-tagging/</link>
		<comments>http://mstrohm.wordpress.com/2009/09/13/notes-on-the-relation-between-search-and-tagging/#comments</comments>
		<pubDate>Sun, 13 Sep 2009 18:39:41 +0000</pubDate>
		<dc:creator>Markus Strohmaier</dc:creator>
				<category><![CDATA[goals]]></category>
		<category><![CDATA[intent]]></category>
		<category><![CDATA[search]]></category>
		<category><![CDATA[tagging]]></category>

		<guid isPermaLink="false">http://mstrohm.wordpress.com/?p=319</guid>
		<description><![CDATA[I had a number of exciting and very inspiring conversations this week with Marc, Rakesh, Fabian, Cathy, and Pranam, as well as with Ed and Rowan. It was great talking to everybody and I wanted to share some of the issues that were discussed. Most conversations focused on the role of tagging, and how it [...]<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=mstrohm.wordpress.com&amp;blog=2808012&amp;post=319&amp;subd=mstrohm&amp;ref=&amp;feed=1" width="1" height="1" />]]></description>
			<content:encoded><![CDATA[<p>I had a number of exciting and very inspiring conversations this week with <a href="http://research.microsoft.com/en-us/people/najork/">Marc</a>, <a href="http://rakesh.agrawal-family.com/">Rakesh</a>, <a href="http://suchanek.name/">Fabian</a>, <a href="http://www.csdl.tamu.edu/~marshall/">Cathy</a>, and <a href="http://pranamkolari.com/">Pranam</a>, as well as with <a href="http://www.edchi.net/">Ed</a> and Rowan. It was great talking to everybody and I wanted to share some of the issues that were discussed. Most conversations focused on the role of tagging, and how it relates to searching the web. I do not claim that any of these interesting thoughts are mine or that my notes offer answers.  They merely aim to serve as pointers for what I consider important issues.</p>
<p><strong>A minority of resources on the web is tagged:</strong></p>
<p>A number of current research projects study the question how tagged resources can inform/improve search. However, a minority of resources on the web is tagged, and the gap between tagged and non-tagged resources is likely increasing (although this seems difficult to predict cf. <a href="http://heymann.stanford.edu/improvewebsearch.html">Paul Heymann&#8217;s work</a>). This would mean that a decreasing ratio of resources on the web have tagged information associated with it. The question then becomes: Why bother analyzing tagging systems in the first place when their (relative) importance is likely to decrease over time?</p>
<p><strong>Tagged resources exhibit topical bias (that&#8217;s a bad thing!):</strong></p>
<p>Tagging is often a geek activity. I am not aware of any studies of delicious&#8217; user population, but it is likely that delicious&#8217; users are more geeky than the rest of the population. This is a bad thing because it would bias any broad attempt leveraging tagging for search. The bias might depend on the particular tagging system though: Flickr seems to have a much broader, and thereby more representative, user base.</p>
<p><strong>Bookmarks exhibit timely bias (that&#8217;s a good thing!):</strong></p>
<p>Bookmarking typically represents an event <em>in time </em>triggered by some user. Most tagging systems therefore provide timestamp information, allowing to infer more information about the context in which a given resource is being tagged. This allows us to use tagging systems for studying how information on the web is organized, filtered, diffused and consumed.</p>
<p><strong>Search supercedes any other form of information access/organisation:</strong></p>
<p>I found this issue to be the most fundamental and controversial one. How do increasingly sophisticated search engines change the way we interact with information? What is the role that directories (such as Yahoo!) and personal ressource collections (such as &#8220;Favorite folders&#8221;) play in a world where search engines can (re)find much information we require with increasing precision? To give an example: Would an electronic record of all resources that a user has ever visited &#8211; and a corresponding search interface to them &#8211; replace the need for information organization ala delicious or Browser Favorites? (all privacy concerns set aside for a moment). How would such a development relate to the desire of users to share information with friends?</p>
<p><strong>Search intent is poorly understood:</strong></p>
<p>While there has been some work on search queries and query log analysis, the intent behind queries remains largely elusive. Existing distinctions (such as <a href="http://www.sigir.org/forum/F2002/broder.pdf">the one by Broder</a>) need further elaboration and refinement. An example would be what Rakesh called pseudo-navigational queries &#8211; where the user has a certain expectation about the information, but this information can be found on several sites (e.g. wikipedia, an encyclopedia or other sites).</p>
<p><strong>Conflict in tagging systems:</strong></p>
<p>Tagging systems are largely tolerant of conflicts, for example, with regard to tagging semantics. This is different from systems such as wikipedia, where conflict is regarded to be an important aspect of the collaboration process. Twitter seems to lie in between those extremes, where conflict can emerge easily (e.g. around hashtags) , with some rudimentary support for resolution.</p>
<p>I truly enjoyed these conversations, and hope that they will continue at some point in the future.</p>
<br />Posted in goals  <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gocomments/mstrohm.wordpress.com/319/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/comments/mstrohm.wordpress.com/319/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godelicious/mstrohm.wordpress.com/319/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/delicious/mstrohm.wordpress.com/319/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gofacebook/mstrohm.wordpress.com/319/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/facebook/mstrohm.wordpress.com/319/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gotwitter/mstrohm.wordpress.com/319/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/twitter/mstrohm.wordpress.com/319/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gostumble/mstrohm.wordpress.com/319/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/stumble/mstrohm.wordpress.com/319/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godigg/mstrohm.wordpress.com/319/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/digg/mstrohm.wordpress.com/319/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/goreddit/mstrohm.wordpress.com/319/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/reddit/mstrohm.wordpress.com/319/" /></a> <img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=mstrohm.wordpress.com&amp;blog=2808012&amp;post=319&amp;subd=mstrohm&amp;ref=&amp;feed=1" width="1" height="1" />]]></content:encoded>
			<wfw:commentRss>http://mstrohm.wordpress.com/2009/09/13/notes-on-the-relation-between-search-and-tagging/feed/</wfw:commentRss>
		<slash:comments>6</slash:comments>
	
		<media:content url="" medium="image">
			<media:title type="html">Markus</media:title>
		</media:content>
	</item>
		<item>
		<title>Why we can&#8217;t quit searching in Twitter</title>
		<link>http://mstrohm.wordpress.com/2009/08/19/why-we-cant-quit-searching-in-twitter/</link>
		<comments>http://mstrohm.wordpress.com/2009/08/19/why-we-cant-quit-searching-in-twitter/#comments</comments>
		<pubDate>Wed, 19 Aug 2009 03:07:34 +0000</pubDate>
		<dc:creator>Markus Strohmaier</dc:creator>
				<category><![CDATA[Uncategorized]]></category>
		<category><![CDATA[information foraging]]></category>
		<category><![CDATA[intent]]></category>
		<category><![CDATA[search]]></category>
		<category><![CDATA[twitter]]></category>

		<guid isPermaLink="false">http://mstrohm.wordpress.com/?p=306</guid>
		<description><![CDATA[I&#8217;m still trying to get my head around this recent Slate magazine article on Seeking: How the brain hard-wires us to love Google, Twitter, and texting. And why that&#8217;s dangerous. In this blog post, I&#8217;m basically trying to tie this article on &#8220;Seeking&#8221; together with two related topics: &#8220;Information Foraging&#8221; and &#8220;Twitter&#8221;. Seeking The Slate [...]<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=mstrohm.wordpress.com&amp;blog=2808012&amp;post=306&amp;subd=mstrohm&amp;ref=&amp;feed=1" width="1" height="1" />]]></description>
			<content:encoded><![CDATA[<p>I&#8217;m still trying to get my head around this recent <a href="http://www.slate.com/">Slate magazine</a> article on<a href="http://www.slate.com/id/2224932/"> Seeking: How the brain hard-wires us to love Google, Twitter, and texting. And why that&#8217;s dangerous</a>.</p>
<p>In this blog post, I&#8217;m basically trying to tie this article on &#8220;Seeking&#8221; together with two related topics: &#8220;Information Foraging&#8221; and &#8220;Twitter&#8221;.</p>
<h1>Seeking</h1>
<p>The Slate magazine article starts by observing that we (humans) are insatiably curious, and that we gather data even if it gets us into trouble. To give an example:</p>
<blockquote><p>Nina Shen Rastogi confessed in <a href="http://scribe.doublex.com/blog/xxfactor/its-8-am-do-you-know-where-your-childrens-laptops-are" target="_blank"><em><strong>Double X</strong></em></a>, &#8220;<em>My boyfriend has threatened to break up with me if I keep whipping out my iPhone to look up random facts about celebrities when we&#8217;re out to dinner.</em>&#8220;</p></blockquote>
<p>The article goes on making several intertwined arguments which I&#8217;m trying to sort out here.</p>
<p>One of the arguments focuses on reporting how lab rats can be artificially put in &#8220;a constant state of sniffing and foraging&#8221;.  It has been observed in experiments that rats tend to endlessly push a button if the button would stimulate electrodes that are connected to the rat&#8217;s <em>lateral hypothalamus</em>. This gets rats locked into a state of endless repetitive behavior. Scientists have since concluded that the <em>lateral hypothalamus </em>represents the brain&#8217;s pleasure center.</p>
<p>Another point is made based on work by University of Michigan professor of psychology <a href="http://www-personal.umich.edu/%7Eberridge/" target="_blank">Kent Berridge</a> (make sure to check out his website after reading this post) who argues that the mammalian brain has separate systems for <em>wanting </em>and <em>liking</em>. Think of it as the difference between <em>wanting </em>to buy a car, and <em>liking </em>to drive it.</p>
<blockquote><p>Wanting [or seeking] and liking are complementary. The former catalyzes us to action; the latter brings us to a satisfied pause. Seeking needs to be turned off, if even for a little while, so that the system does not run in an endless loop.</p></blockquote>
<p>Interestingly, our brain seems to have evolved into &#8220;being more stingy with mechanisms for pleasure than desire&#8221;: Mammals are rewarded by wanting (as opposed to liking), because creatures that lack motivation (but thrive on pleasure) are likely to lead short lives (due to <a href="http://en.wikipedia.org/wiki/Negative_selection_%28natural_selection%29">negative selection</a>).</p>
<p>There are lab experiments reporting on how the <em>wanting </em>system can take over the <em>liking </em>system. Washington State University neuroscientist <a href="http://www.vetmed.wsu.edu/depts-vcapp/people/Panksepp-endowed.asp" target="_blank">Jaak Panksepp</a> says that &#8220;a way to drive animals into a frenzy is to give them only tiny bits of food which sends their <em>seeking </em>system into hypereactivity.&#8221;</p>
<h1>Information Foraging</h1>
<p>This brings me to a book I&#8217;m currently reading on &#8220;<a href="http://www.amazon.com/Information-Foraging-Theory-Interaction-Human-Technology/dp/0195173325">Information Foraging Theory</a>&#8221; by <a href="http://web.mac.com/peter.pirolli/">Peter Pirolli</a> (I have not finished it yet!). At the beginning, the book argues that the way users search for information can be likened to the way animals forage for food. Information Foraging Theory makes a basic distinction between two types of states a forager is in: <em>between-patch</em> and <em>within-patch</em> states. In <em>between-patch </em>states, foragers are concerned with finding new patches to feed on, whereas in <em>within-patch </em>states, creatures are concerned with consuming a patch. Information Foraging Theory is in part concerned with modeling &#8220;optimal&#8221; strategies for foragers that would maximize some gain (e.g. information value) function, based on the <a href="http://en.wikipedia.org/wiki/Marginal_value_theorem">Marginal Value Theorem</a>, depicted in the illustration below.</p>
<p style="text-align:left;"><img class="aligncenter" title="Marginal Value Theorem" src="http://upload.wikimedia.org/wikipedia/commons/c/ce/Marginalvaluetheorem.jpg" alt="" width="380" height="294" />In this illustration from wikipedia, <em>Transit time</em> refers to <em>between patch </em>(left side) and <em>Time foraging </em>in patch refers to <em>within patch</em> (right side of the diagram). The slope of the tangent corresponds to the <em>optimal rate of gain</em>. There is an interesting relationship between time spent <em>within </em>and <em>between </em>patches. If patches yield very little average gain (e.g. calories, or information value), patches are easily exhausted, quickly putting foragers into the <em>between patch </em>state again.</p>
<h1>Twitter, Seeking and Information Foraging</h1>
<p>Now I&#8217;m trying to tie these two topics together (there might even be a common basis for the relationship between these topics in the literature).</p>
<p><strong>Seeking and Information Foraging: </strong>It seems that <em>wanting </em>and <em>liking </em>systems relate to <em>within </em>and <em>between </em>patch states in Information Foraging Theory. If lab rats push a button in an experiment, it seems that the rat&#8217;s electrodes modify their liking system in a way that prevents them from engaging <em>within a patch</em>, and puts them into a <em>between patch</em> state. When animals are sent into a frenzy by giving them tiny bits of food, <em>within patch </em>time is minimalized, sending them right back into a <em>between patch </em>state. In this scenario, animals spend relatively more time searching than actually consuming food, <em>effectively reducing their overall gain </em>in comparison to scenarios where they would be confronted with large bits of food (higher gain patches).</p>
<p><strong>Finally, how this all might relate to Twitter</strong>: I&#8217;m arguing that Twitter&#8217;s message restriction to 140 characters (disregarding links that might be posted in Twitter messages) artificially reduces <em>within-patch </em>time. The gains of a patch (a tweet) might still vary, but gain is not dependent on within-patch time anymore. The average &#8220;<em>within-patch</em>/gain function&#8221; (right side of the above illustration) seems to be constant! It always takes the same approximate amount to read a tweet (assuming there are no URLs in a tweet), reading &#8220;longer&#8221; does not increase the gain.</p>
<p>In addition, Twitter&#8217;s particular user interface (chronological listing of tweets) seems to be weak in terms of <a href="http://en.wikipedia.org/wiki/Information_foraging#Information_scent">information scent</a>: Judging whether a tweet is relevant or not requires a forager to read the entire tweet, regardless whether the patch (the tweet) contains a gain (an informative value) or not.  This seems to yield to a situation where in systems such as Twitter, users quickly change between <em>within patch</em> (reading a tweet) and <em>between patch </em>(finding the next tweet to read) states<em>. </em>The reason to that might be the following: When a forager has exhausted a patch, he would switch back to a <em>between patch </em>state. However, due to a deprivation of information scent on the Twitter user interface, the user is largely helpless in the <em>between patch </em>state (he does not know where to search next, other than reading the next tweet). This leaves users with a desire to change back to <em>within patch </em>states as quickly as possible (only reading entire tweets can help to assess relevance), thereby potentially adapting chaotic and/or irrational strategies.</p>
<p>The above observation might also explain the frenzy that animals are sent into when being offered tiny bits of food while being deprived of &#8220;scent&#8221; to inform their <em>between patch </em>phases. The hypothesis would be that the frenzy would not occur if the animals were offered clues regarding where the next patch is to be expected, and what gain they could get from exhausting it (of course behavioural biologists might have already studied this question).</p>
<p>Returning to Twitter, it seems that the same effect that sends animals into a frenzy could be at place at Twitter, where users &#8211; due to a combination of small within-patch times and weak information scent &#8211; engage in uninformed foraging of artificially small information patches.</p>
<p>This of course is the provocative conclusion of the Slate Magazine article. What I found interesting is how these three topics &#8211; seeking, information foraging and Twitter &#8211; nicely tie into each other on a theoretical level.</p>
<p>I still have not figured out what a reduction of <em>within patch </em>times <em>alone </em>means from an Information Foraging Theoretic perspective &#8211; I&#8217;d like to figure that out at some point in the future.</p>
<br />Posted in Uncategorized  <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gocomments/mstrohm.wordpress.com/306/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/comments/mstrohm.wordpress.com/306/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godelicious/mstrohm.wordpress.com/306/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/delicious/mstrohm.wordpress.com/306/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gofacebook/mstrohm.wordpress.com/306/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/facebook/mstrohm.wordpress.com/306/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gotwitter/mstrohm.wordpress.com/306/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/twitter/mstrohm.wordpress.com/306/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gostumble/mstrohm.wordpress.com/306/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/stumble/mstrohm.wordpress.com/306/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godigg/mstrohm.wordpress.com/306/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/digg/mstrohm.wordpress.com/306/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/goreddit/mstrohm.wordpress.com/306/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/reddit/mstrohm.wordpress.com/306/" /></a> <img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=mstrohm.wordpress.com&amp;blog=2808012&amp;post=306&amp;subd=mstrohm&amp;ref=&amp;feed=1" width="1" height="1" />]]></content:encoded>
			<wfw:commentRss>http://mstrohm.wordpress.com/2009/08/19/why-we-cant-quit-searching-in-twitter/feed/</wfw:commentRss>
		<slash:comments>0</slash:comments>
	
		<media:content url="" medium="image">
			<media:title type="html">Markus</media:title>
		</media:content>

		<media:content url="http://upload.wikimedia.org/wikipedia/commons/c/ce/Marginalvaluetheorem.jpg" medium="image">
			<media:title type="html">Marginal Value Theorem</media:title>
		</media:content>
	</item>
		<item>
		<title>List of Social Tagging Datasets</title>
		<link>http://mstrohm.wordpress.com/2009/07/22/list-of-available-social-tagging-datasets/</link>
		<comments>http://mstrohm.wordpress.com/2009/07/22/list-of-available-social-tagging-datasets/#comments</comments>
		<pubDate>Wed, 22 Jul 2009 15:34:22 +0000</pubDate>
		<dc:creator>Markus Strohmaier</dc:creator>
				<category><![CDATA[Uncategorized]]></category>

		<guid isPermaLink="false">http://mstrohm.wordpress.com/?p=302</guid>
		<description><![CDATA[I&#8217;m currently compiling a list of social tagging datasets for our current / future research, but since it might be of interest to others as well I&#8217;m sharing it. Here&#8217;s the link: A non-exhaustive list of Social Tagging Datasets that are available for research If you are aware of other social tagging datasets available for [...]<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=mstrohm.wordpress.com&amp;blog=2808012&amp;post=302&amp;subd=mstrohm&amp;ref=&amp;feed=1" width="1" height="1" />]]></description>
			<content:encoded><![CDATA[<p>I&#8217;m currently compiling a list of social tagging datasets for our current / future research, but since it might be of interest to others as well I&#8217;m sharing it. Here&#8217;s the link:</p>
<p><a href="http://kmi.tugraz.at/staff/markus/datasets/">A non-exhaustive list of Social Tagging Datasets that are available for research</a></p>
<p>If you are aware of other social tagging datasets available for research, please let me know by leaving a comment to this post.</p>
<br />Posted in Uncategorized  <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gocomments/mstrohm.wordpress.com/302/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/comments/mstrohm.wordpress.com/302/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godelicious/mstrohm.wordpress.com/302/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/delicious/mstrohm.wordpress.com/302/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gofacebook/mstrohm.wordpress.com/302/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/facebook/mstrohm.wordpress.com/302/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gotwitter/mstrohm.wordpress.com/302/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/twitter/mstrohm.wordpress.com/302/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gostumble/mstrohm.wordpress.com/302/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/stumble/mstrohm.wordpress.com/302/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godigg/mstrohm.wordpress.com/302/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/digg/mstrohm.wordpress.com/302/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/goreddit/mstrohm.wordpress.com/302/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/reddit/mstrohm.wordpress.com/302/" /></a> <img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=mstrohm.wordpress.com&amp;blog=2808012&amp;post=302&amp;subd=mstrohm&amp;ref=&amp;feed=1" width="1" height="1" />]]></content:encoded>
			<wfw:commentRss>http://mstrohm.wordpress.com/2009/07/22/list-of-available-social-tagging-datasets/feed/</wfw:commentRss>
		<slash:comments>15</slash:comments>
	
		<media:content url="" medium="image">
			<media:title type="html">Markus</media:title>
		</media:content>
	</item>
		<item>
		<title>Motivations for Tagging: Categorization vs. Description</title>
		<link>http://mstrohm.wordpress.com/2009/07/21/motivations-for-tagging-categorization-vs-description/</link>
		<comments>http://mstrohm.wordpress.com/2009/07/21/motivations-for-tagging-categorization-vs-description/#comments</comments>
		<pubDate>Tue, 21 Jul 2009 16:15:05 +0000</pubDate>
		<dc:creator>Markus Strohmaier</dc:creator>
				<category><![CDATA[goals]]></category>
		<category><![CDATA[categorization]]></category>
		<category><![CDATA[description]]></category>
		<category><![CDATA[intent]]></category>
		<category><![CDATA[motivation]]></category>
		<category><![CDATA[tagging]]></category>
		<category><![CDATA[user]]></category>

		<guid isPermaLink="false">http://mstrohm.wordpress.com/?p=294</guid>
		<description><![CDATA[UPDATE March 17 2010: More results can be found in the following publication: M. Strohmaier, C. Koerner, R. Kern, Why do Users Tag? Detecting Users’ Motivation for Tagging in Social Tagging Systems, 4th International AAAI Conference on Weblogs and Social Media (ICWSM2010), Washington, DC, USA, May 23-26, 2010. (Download pdf) In a past post, I [...]<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=mstrohm.wordpress.com&amp;blog=2808012&amp;post=294&amp;subd=mstrohm&amp;ref=&amp;feed=1" width="1" height="1" />]]></description>
			<content:encoded><![CDATA[<p><span style="color:#ff0000;">UPDATE   March 17 2010</span>: More results  can be found in the following  publication: <em>M. Strohmaier, C.   Koerner, R. Kern,  <strong>Why do  Users Tag? Detecting  Users’  Motivation  for Tagging in Social Tagging  Systems</strong>, 4th   International  AAAI Conference on Weblogs and  Social Media (ICWSM2010),   Washington,  DC, USA, May 23-26, 2010. </em>(<a href="http://kmi.tugraz.at/staff/markus/documents/2010_ICWSM2010_Detecting_Tagging_Motivation.pdf">Download   pdf</a>)</p>
<p>In a <a href="http://mstrohm.wordpress.com/2009/04/05/why-do-users-tag-detecting-user-motivation-in-tagging-systems/">past post, I talked about the role of tagging motivation in social tagging systems, and a distinction between users who use tags for Categorization and users who use tags for Description purposes</a>.</p>
<p>One question that is interesting in this context is: &#8220;<em>How do tag clouds of Categorizers respectively Describers actually look like &#8211; and what can we learn from them?</em>&#8220;.</p>
<p><strong>Categorizers vs. Describers: </strong>Our previous work suggests how tag clouds of Categorizers/Describers would look like <em>theoretically</em>: <strong>Categorizers </strong>would rather use general terms for tagging, terms that are useful labels for categories based on his model of the world.  On the other hand, <strong>Describers </strong>would use terms that are specific to a resource or concepts that can be found directly within a resource, based on characteristics of the resource. That&#8217;s the <a href="http://kmi.tugraz.at/staff/markus/documents/2009_ACM_HT09_Understanding_the_motivation_behind_tagging_POSTER.pdf"><em>theory</em></a>.</p>
<p>Christian Körner, one of my PhD students, looked into this question <em>empirically </em>based on his current work, where he applies <a href="http://http://mstrohm.wordpress.com/2009/04/05/why-do-users-tag-detecting-user-motivation-in-tagging-systems/">previously discussed measures to detect tagging motivation (Conditional Tag Entropy and Orphaned Tags) to several tagging datasets</a>. While in reality we expected that most tagging behaviour is the result of a combination of categorization and description motivation, Christian was particulary interested in &#8220;extreme&#8221; cases, i.e. cases of &#8220;extreme&#8221; Categorizers and &#8220;extreme&#8221; Describers. Here are selected results:</p>
<p><strong>Example of an Extreme Categorizer:</strong> Among 445 delicious users, the following screenshot shows the tag cloud of the single user that scored highest on our &#8220;Categorization&#8221; measure (<em>the most extreme Categorizer in our dataset</em>).</p>
<div id="attachment_292" class="wp-caption aligncenter" style="width: 520px"><img class="size-full wp-image-292" title="delicious_categorizer" src="http://mstrohm.files.wordpress.com/2009/07/delicious_categorizer.png?w=510&#038;h=208" alt="delicious_categorizer" width="510" height="208" /><p class="wp-caption-text">An example tag cloud of an &quot;Extreme Categorizer&quot; (based on ~1900 bookmarks)</p></div>
<p>The results are quite intriguing: The above user clearly uses very general terms to annotate his resources, and introduces an elaborated taxonomy to categorize them. While some parts of his vocabulary are more elaborate and fine grained (e.g. &#8220;fashion&#8221; and corresponding sub-categories &#8220;fashion_blog&#8221; and &#8220;fashion_brand&#8221;) others are less elaborated  (e.g. &#8220;games, health, etc&#8221;). The user also produced a controlled vocabulary and sticked to it over the course of 1900 bookmarks, which I think can be seen as another indication for the inclination of this user to use tags for categorization purposes. The fact that a combination of our measures for tagging motivation (Conditional Tag Entropy and Orphaned Tags) has produced this interesting example of an extreme Categorizers provides some evidence for the plausibility of these measures. I think that&#8217;s great news.</p>
<p><strong>Example of an Extreme Describer: </strong>The next screenshot shows an excerpt of a tag cloud of the user that scored highest on the &#8220;Description&#8221; measure (<em>the most extreme Describer in our dataset</em>).</p>
<div id="attachment_293" class="wp-caption aligncenter" style="width: 520px"><img class="size-full wp-image-293" title="delicious_describer" src="http://mstrohm.files.wordpress.com/2009/07/delicious_describer.png?w=510&#038;h=443" alt="delicious_describer" width="510" height="443" /><p class="wp-caption-text">An example tag cloud of an &quot;Extreme Describer&quot; (excerpt, based on ~1700 bookmarks)</p></div>
<p>It is interesting to note that this tag cloud represents an excerpt, the original tag cloud of this user is ~twice this size. The user clearly introduces a large set of tags, and uses many different variations of the same or similiar concepts, without much consideration with regard to terminological or conceptual differences (e.g. exce,  excel, Excel_Functions, Excel2007, Exceler, excelets, ExcelPoster, Excl, excxel). Again, the fact that our measures for tagging motivation produced this particular user as an extreme example of a Describer can be seen as an indicator for the principle plausibility of our measures.</p>
<p>However, what is also apparent from this example is that even in the case of this extreme Describer, some categories seem to be present in his tag vocabulary (e.g. &#8220;ebooks, fun, etc&#8221;). This suggests that a binary approach to understanding tagging motivation (a user is EITHER a Categorizer OR a Describer) is inplausible.</p>
<p><strong>Open Questions: </strong>Overall, the examples of two users motivated by diametrically different motivations for tagging raises a number of interesting questions worth studying: What are characteristics, utilities and properties of tags produced by Categorizers and Describers? How do these different types of tagging motivation influence resulting folksonomies? And how do they influence quality attributes of algorithms (e.g. search, ranking) and applications (e.g. tag recommendation) that are processing folksonomical data? We are looking into some of these questions in our current research.</p>
<p><span style="color:#ff0000;">UPDATE   March 17 2010</span>: More results  can be found in the following  publication: <em>M. Strohmaier, C.   Koerner, R. Kern,  <strong>Why do  Users Tag? Detecting  Users’  Motivation  for Tagging in Social Tagging  Systems</strong>, 4th   International  AAAI Conference on Weblogs and  Social Media (ICWSM2010),   Washington,  DC, USA, May 23-26, 2010. </em>(<a href="http://kmi.tugraz.at/staff/markus/documents/2010_ICWSM2010_Detecting_Tagging_Motivation.pdf">Download   pdf</a>)<img class="aligncenter size-full wp-image-206" title="Motivations for Tagging: Categorization vs. Description" src="http://mstrohm.files.wordpress.com/2009/04/1x1.png?w=510" alt="Motivations for Tagging: Categorization vs. Description"   /></p>
<br />Posted in goals  <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gocomments/mstrohm.wordpress.com/294/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/comments/mstrohm.wordpress.com/294/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godelicious/mstrohm.wordpress.com/294/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/delicious/mstrohm.wordpress.com/294/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gofacebook/mstrohm.wordpress.com/294/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/facebook/mstrohm.wordpress.com/294/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gotwitter/mstrohm.wordpress.com/294/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/twitter/mstrohm.wordpress.com/294/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gostumble/mstrohm.wordpress.com/294/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/stumble/mstrohm.wordpress.com/294/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godigg/mstrohm.wordpress.com/294/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/digg/mstrohm.wordpress.com/294/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/goreddit/mstrohm.wordpress.com/294/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/reddit/mstrohm.wordpress.com/294/" /></a> <img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=mstrohm.wordpress.com&amp;blog=2808012&amp;post=294&amp;subd=mstrohm&amp;ref=&amp;feed=1" width="1" height="1" />]]></content:encoded>
			<wfw:commentRss>http://mstrohm.wordpress.com/2009/07/21/motivations-for-tagging-categorization-vs-description/feed/</wfw:commentRss>
		<slash:comments>0</slash:comments>
	
		<media:content url="" medium="image">
			<media:title type="html">Markus</media:title>
		</media:content>

		<media:content url="http://mstrohm.files.wordpress.com/2009/07/delicious_categorizer.png" medium="image">
			<media:title type="html">delicious_categorizer</media:title>
		</media:content>

		<media:content url="http://mstrohm.files.wordpress.com/2009/07/delicious_describer.png" medium="image">
			<media:title type="html">delicious_describer</media:title>
		</media:content>

		<media:content url="http://mstrohm.files.wordpress.com/2009/04/1x1.png" medium="image">
			<media:title type="html">Motivations for Tagging: Categorization vs. Description</media:title>
		</media:content>
	</item>
	</channel>
</rss>
