<?xml version="1.0" encoding="UTF-8"?>
<rss version="2.0"
	xmlns:content="http://purl.org/rss/1.0/modules/content/"
	xmlns:wfw="http://wellformedweb.org/CommentAPI/"
	xmlns:dc="http://purl.org/dc/elements/1.1/"
	xmlns:atom="http://www.w3.org/2005/Atom"
	xmlns:sy="http://purl.org/rss/1.0/modules/syndication/"
	xmlns:slash="http://purl.org/rss/1.0/modules/slash/"
	xmlns:georss="http://www.georss.org/georss" xmlns:geo="http://www.w3.org/2003/01/geo/wgs84_pos#" xmlns:media="http://search.yahoo.com/mrss/"
	>

<channel>
	<title>GigaOM &#187; analytics</title>
	<atom:link href="http://gigaom.com/tag/analytics/feed/" rel="self" type="application/rss+xml" />
	<link>http://gigaom.com</link>
	<description></description>
	<lastBuildDate>Fri, 24 May 2013 06:27:15 +0000</lastBuildDate>
	<language>en</language>
	<sy:updatePeriod>hourly</sy:updatePeriod>
	<sy:updateFrequency>1</sy:updateFrequency>
	<generator>http://wordpress.com/</generator>
<cloud domain='gigaom.com' port='80' path='/?rsscloud=notify' registerProcedure='' protocol='http-post' />
<image>
		<url>http://0.gravatar.com/blavatar/0db8f6557d022075dbbf010c54d46d93?s=96&#038;d=http%3A%2F%2Fs2.wp.com%2Fi%2Fbuttonw-com.png</url>
		<title>GigaOM &#187; analytics</title>
		<link>http://gigaom.com</link>
	</image>
	<atom:link rel="search" type="application/opensearchdescription+xml" href="http://gigaom.com/osd.xml" title="GigaOM" />
	<atom:link rel='hub' href='http://gigaom.com/?pushpress=hub'/>
		<item>
		<title>How big data analytics drives competitive advantage</title>
		<link>http://pro.gigaom.com/report/how-big-data-analytics-drives-competitive-advantage/</link>
		<comments>http://pro.gigaom.com/report/how-big-data-analytics-drives-competitive-advantage/#comments</comments>
		<pubDate>Mon, 20 May 2013 06:55:26 +0000</pubDate>
		<dc:creator>Editor</dc:creator>
				<category><![CDATA[analytics]]></category>
		<category><![CDATA[barack obama]]></category>
		<category><![CDATA[big data]]></category>
		<category><![CDATA[Business Intelligence]]></category>
		<category><![CDATA[CPU technologies]]></category>
		<category><![CDATA[CRM]]></category>
		<category><![CDATA[data management]]></category>
		<category><![CDATA[data warehouse]]></category>
		<category><![CDATA[database management systems]]></category>
		<category><![CDATA[enterprise IT]]></category>
		<category><![CDATA[information technology]]></category>
		<category><![CDATA[Infrastructure optimization]]></category>
		<category><![CDATA[machine-learning]]></category>
		<category><![CDATA[Network performance]]></category>
		<category><![CDATA[rdbms]]></category>
		<category><![CDATA[Relational database]]></category>
		<category><![CDATA[social media]]></category>

		<guid isPermaLink="false">http://pro.gigaom.com/?post_type=go-report&#038;p=176801/</guid>
		<description><![CDATA[Few companies today have the time or the analytics expertise to apply statistics and complex data modeling to regular or even daily business decisions and operations. Now, however, an ecosystem of companies is emerging to fill this need.<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=gigaom.com&#038;blog=14960843&#038;post=648489&#038;subd=gigaom2&#038;ref=&#038;feed=1" width="1" height="1" />]]></description>
				<content:encoded><![CDATA[<p>Few companies today have the time or the analytics expertise to apply statistics and complex data modeling to regular or even daily business decisions and operations. Now, however, an ecosystem of companies is emerging to fill this need.</p>
<br />  <img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=gigaom.com&#038;blog=14960843&#038;post=648489&#038;subd=gigaom2&#038;ref=&#038;feed=1" width="1" height="1" /><p><a href="http://pubads.g.doubleclick.net/gampad/jump?iu=/1008864/GigaOM_RSS_300x250&#038;sz=300x250&#038;c=30556"><img src="http://pubads.g.doubleclick.net/gampad/ad?iu=/1008864/GigaOM_RSS_300x250&#038;sz=300x250&#038;c=30556" /></a></p><p><strong>Related research and analysis from GigaOM Pro:</strong><br />Subscriber content. <a href="http://pro.gigaom.com/?utm_source=pro&utm_medium=editorial&utm_campaign=auto3&utm_term=648489+how-big-data-analytics-drives-competitive-advantage&utm_content=benwoony">Sign up for a free trial</a>.</p><ul><li><a href="http://pro.gigaom.com/2012/12/big-data-2013-key-trends-and-companies-to-watch/?utm_source=pro&utm_medium=editorial&utm_campaign=auto3&utm_term=648489+how-big-data-analytics-drives-competitive-advantage&utm_content=benwoony">Big data 2013: key trends and companies to watch</a></li><li><a href="http://pro.gigaom.com/2012/04/infrastructure-q1-cloud-and-big-data-woo-the-enterprise/?utm_source=pro&utm_medium=editorial&utm_campaign=auto3&utm_term=648489+how-big-data-analytics-drives-competitive-advantage&utm_content=benwoony">Infrastructure Q1: Cloud and big data woo enterprises</a></li><li><a href="http://pro.gigaom.com/2012/12/sector-roadmap-health-care-and-big-data-in-2012/?utm_source=pro&utm_medium=editorial&utm_campaign=auto3&utm_term=648489+how-big-data-analytics-drives-competitive-advantage&utm_content=benwoony">Health care and big data in 2012</a></li></ul>]]></content:encoded>
			<wfw:commentRss>http://pro.gigaom.com/report/how-big-data-analytics-drives-competitive-advantage/feed/</wfw:commentRss>
		<slash:comments>0</slash:comments>
	
		<media:content url="http://2.gravatar.com/avatar/b58d6d331ef3725b56f64faa3d21be12?s=96&#38;d=retro&#38;r=PG" medium="image">
			<media:title type="html">benwoony</media:title>
		</media:content>
	</item>
		<item>
		<title>Tableau closes Day 1 as a $2.9B public company, up 64 percent</title>
		<link>http://gigaom.com/2013/05/17/tableau-closes-day-1-as-a-2-9-billion-public-company-up-64-percent/</link>
		<comments>http://gigaom.com/2013/05/17/tableau-closes-day-1-as-a-2-9-billion-public-company-up-64-percent/#comments</comments>
		<pubDate>Fri, 17 May 2013 22:59:24 +0000</pubDate>
		<dc:creator>Derrick Harris</dc:creator>
				<category><![CDATA[analytics]]></category>
		<category><![CDATA[big data]]></category>
		<category><![CDATA[data]]></category>
		<category><![CDATA[ipo]]></category>
		<category><![CDATA[tableau]]></category>
		<category><![CDATA[Visualization]]></category>

		<guid isPermaLink="false">http://gigaom.com/?p=646748</guid>
		<description><![CDATA[Tableau had a successful IPO, closing the trading day up 64 percent and raking in $254 million. CEO Christian Chabot says the company is now set to make itself known around the world.<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=gigaom.com&#038;blog=14960843&#038;post=646748&#038;subd=gigaom2&#038;ref=&#038;feed=1" width="1" height="1" />]]></description>
				<content:encoded><![CDATA[<p>Data analytics star Tableau had a successful initial public offering on Friday, <a href="http://data.cnbc.com/quotes/DATA">closing the day up nearly 64 percent</a> at $50.75 per share. That means the company brought in about $254 million (it sold 5 million shares, while stockholders sold 3.4 million) and has a market cap of $2.9 billion. Shares have remained relatively steady in after-hours trading, trending down only slightly.</p>
<p>&#8220;We&#8217;re thrilled,&#8221; Tableau co-founder and CEO Christian Chabot told me during a call after the market closed. One should hope so.</p>
<p>Chabot and his fellow co-founders stand to make a lot of money if today&#8217;s closing price holds up, as does its sole investor NEA. The firm put $15 million into Tableau since it launched in 2003, and has rode that sum to profitability and more than $127 million in annual revenue.</p>
<p>Here&#8217;s a quick chart (made using Tableau Public) showing who owns how many share and what they&#8217;re potentially worth.</p>
<p><a href="http://gigaom2.files.wordpress.com/2013/05/tabipo.jpg"><img src="http://gigaom2.files.wordpress.com/2013/05/tabipo.jpg?w=708&#038;h=443" alt="tabipo" width="708" height="443"  class="aligncenter size-large wp-image-646811" /></a></p>
<p>The company didn&#8217;t really need more capital to operate, Chabot said, but one of the primary drivers was to raise awareness of the company. It has about 12,000 customers, he said, but there are millions more possible users. As part of attracting them, the company is going to expand globally and is working to improve its reach across mobile devices, the cloud and the Mac operating system.</p>
<p>&#8220;I don&#8217;t believe in the this whole &#8216;or&#8217; philosophy with computers,&#8221; Chabot said. &#8220;It&#8217;s &#8216;and&#8217;&#8221; &#8212; meaning people will use desktops and tablets and smartphones.</p>
<p>More prominence and more users singing its praises might also dispel the notion that Tableau is just about visualization. It has some fairly advanced features under the covers (as a commenter <a href="http://gigaom.com/2013/05/16/tableau-prices-its-stock-at-31-per-share-for-fridays-ipo/">to my earlier post</a> about the company&#8217;s influence pointed out), even if they&#8217;re hidden by the relatively simple user experience. </p>
<p>&#8220;Tableau is not a visualization company, per se, it&#8217;s really an analytics company,&#8221; Chabot said.</p>
<p>However, if the company really wants to expand its reach to everyone one who wants to gain knowledge from data &#8212; something Chabot calls a &#8220;timeless human need&#8221; &#8212; <a href="http://gigaom.com/2013/04/07/we-need-a-data-democracy-not-a-benevolent-data-dictatorship/">it might actually need to get simpler</a>. More marketing can let potential business users know about new features like forecasting and data-extraction, but it won&#8217;t make a dentist is Des Moines better at formatting his data.</p>
<p>After raising $254 million in its IPO, though, Tableau is in a good place to do whatever it has to.</p>
<br />  <img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=gigaom.com&#038;blog=14960843&#038;post=646748&#038;subd=gigaom2&#038;ref=&#038;feed=1" width="1" height="1" /><p><a href="http://pubads.g.doubleclick.net/gampad/jump?iu=/1008864/GigaOM_RSS_300x250&#038;sz=300x250&#038;c=869458"><img src="http://pubads.g.doubleclick.net/gampad/ad?iu=/1008864/GigaOM_RSS_300x250&#038;sz=300x250&#038;c=869458" /></a></p><p><strong>Related research and analysis from GigaOM Pro:</strong><br />Subscriber content. <a href="http://pro.gigaom.com/?utm_source=data&utm_medium=editorial&utm_campaign=auto3&utm_term=646748+tableau-closes-day-1-as-a-2-9-billion-public-company-up-64-percent&utm_content=dharrisstructure">Sign up for a free trial</a>.</p><ul><li><a href="http://pro.gigaom.com/2012/01/newnet-q4-platform-mania-and-social-commerce-shakeout/?utm_source=data&utm_medium=editorial&utm_campaign=auto3&utm_term=646748+tableau-closes-day-1-as-a-2-9-billion-public-company-up-64-percent&utm_content=dharrisstructure">NewNet Q4: Platform mania and social commerce shakeout</a></li><li><a href="http://pro.gigaom.com/2012/01/newnet-q4-platform-mania-and-social-commerce-shakeout/?utm_source=data&utm_medium=editorial&utm_campaign=auto3&utm_term=646748+tableau-closes-day-1-as-a-2-9-billion-public-company-up-64-percent&utm_content=dharrisstructure">NewNet Q4: Platform mania and social commerce shakeout</a></li><li><a href="http://pro.gigaom.com/2012/05/the-importance-of-putting-the-u-and-i-in-visualization/?utm_source=data&utm_medium=editorial&utm_campaign=auto3&utm_term=646748+tableau-closes-day-1-as-a-2-9-billion-public-company-up-64-percent&utm_content=dharrisstructure">The importance of putting the U and I in visualization</a></li></ul>]]></content:encoded>
			<wfw:commentRss>http://gigaom.com/2013/05/17/tableau-closes-day-1-as-a-2-9-billion-public-company-up-64-percent/feed/</wfw:commentRss>
		<slash:comments>0</slash:comments>
	
		<media:thumbnail url="http://gigaom2.files.wordpress.com/2013/05/tabyahoo.png?w=150" />
		<media:content url="http://gigaom2.files.wordpress.com/2013/05/tabyahoo.png?w=150" medium="image">
			<media:title type="html">tabyahoo</media:title>
		</media:content>

		<media:content url="http://0.gravatar.com/avatar/9e48ffa0913f65c577727457dd63023f?s=96&#38;d=retro&#38;r=PG" medium="image">
			<media:title type="html">dharrisstructure</media:title>
		</media:content>

		<media:content url="http://gigaom2.files.wordpress.com/2013/05/tabipo.jpg?w=708" medium="image">
			<media:title type="html">tabipo</media:title>
		</media:content>
	</item>
		<item>
		<title>Tableau prices its stock at $31 per share for Friday&#8217;s IPO</title>
		<link>http://gigaom.com/2013/05/16/tableau-prices-its-stock-at-31-per-share-for-fridays-ipo/</link>
		<comments>http://gigaom.com/2013/05/16/tableau-prices-its-stock-at-31-per-share-for-fridays-ipo/#comments</comments>
		<pubDate>Fri, 17 May 2013 00:03:48 +0000</pubDate>
		<dc:creator>Derrick Harris</dc:creator>
				<category><![CDATA[analytics]]></category>
		<category><![CDATA[big data]]></category>
		<category><![CDATA[Business Intelligence]]></category>
		<category><![CDATA[data]]></category>
		<category><![CDATA[tableau]]></category>
		<category><![CDATA[Visualization]]></category>

		<guid isPermaLink="false">http://gigaom.com/?p=646412</guid>
		<description><![CDATA[Tableau's initial public offering is on Friday, and expectations are high. The company has inspired much of the next-generation analytics space, and how it fares could be telling about just how powerful the data movement is.<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=gigaom.com&#038;blog=14960843&#038;post=646412&#038;subd=gigaom2&#038;ref=&#038;feed=1" width="1" height="1" />]]></description>
				<content:encoded><![CDATA[<p><a href="http://www.tableausoftware.com/">Tableau Software</a> has priced shares for its initial public offering on Friday at $31. The company is offering up 5 million shares, while stockholders are offering 3.2 million shares. Tableau co-founder and CEO Christian Chabot will ring the opening bell on the New York Stock Exchange, where the company will list under the symbol &#8220;DATA.&#8221;</p>
<p>That&#8217;s an apt ticker symbol for a company that is in some ways a bellwether for the current fascination with all things data. Tableau isn&#8217;t a big data company, per se, but its visualization software breathes life into many big data calculations. Its <a href="http://gigaom.com/2013/04/07/we-need-a-data-democracy-not-a-benevolent-data-dictatorship/">focus on making software that&#8217;s easy to use</a> and that creates visually captivating charts has turned people from numerous professions into amateur data analysts. (I&#8217;ve even used it in the past, <a href="http://gigaom.com/2011/10/25/google-shows-the-limits-of-a-free-web/">including for the first time</a> in 2011.)</p>
<div id="attachment_646423" class="wp-caption alignright" style="width: 298px"><a href="http://gigaom2.files.wordpress.com/2013/05/und-leadership-christian-small.jpg"><img  alt="Christian Chabot" src="http://gigaom2.files.wordpress.com/2013/05/und-leadership-christian-small.jpg?w=708"   class="size-full wp-image-646423" /></a><p class="wp-caption-text">Christian Chabot</p></div>
<p>As Chabot <a href="http://gigaom.com/2012/02/23/thanks-to-consumerization-its-ipo-season-in-analytics/">told me during a conversation in 2011</a>, &#8220;In any field of human endeavor &#8230; there are a hundred to a thousand more people who understand the data of that field more than they understand reporting and analytics.&#8221;</p>
<p>Anytime you read about a hot new visualization or analytics startup promising the moon, you&#8217;re also seeing the results of what Tableau has sown in terms of the user experience. Many of those same companies will be quick to tell you how limited Tableau&#8217;s capabilities are. It&#8217;s memory-bound, it doesn&#8217;t have a database, it&#8217;s not available in the cloud (or on the Mac operating system), it can&#8217;t do predictive analytics. All true.</p>
<p>Of course, if it raises the kind of capital it expects to by going public, it can build and buy a lot of those capabilities. If pricing stays flat all day Friday, Tableau stands to make $155 million from its 5 million shares. Previous estimates <a href="http://www.forbes.com/sites/tomiogeron/2013/05/16/tableau-software-raises-ipo-price-range/">had Tableau&#8217;s market cap at around $1.7 billion</a> at a price of $29 per share (the company&#8217;s S-1 filing <a href="http://edgar.sec.gov/Archives/edgar/data/1303652/000119312513138700/d469057ds1.htm#rom469057_17">is available here</a>).</p>
<p>If investors have really bought into the company and the concept of a data-driven world, then who knows. Machine-data expert Splunk wnet public in 2012, flying the big data banner, and <a href="http://gigaom.com/2012/04/19/splunk-ipo-kills-lives-up-to-expectations/">saw shares peak at 91 percent above</a> its original asking price of $17.</p>
<p>I&#8217;m not suggesting Tableau is the biggest name in data, or even that it will some day become it. This next-generation analytics field is very young, with startups and larger vendors alike sometimes competing against themselves to win wholly new accounts than trying to displace legacy vendors within large enterprises. And every month, it seems, <a href="http://gigaom.com/2013/05/13/visualization-is-the-future-6-startups-re-imagining-how-we-consume-data/">I come across some new startup</a> that was built with the same principles in mind as Tableau, but with the advantage of having today&#8217;s best practices baked into its software.</p>
<p>But Tableau definitely commands a lot of the mindshare. How it fares as a public company <a href="http://gigaom.com/2013/04/03/a-tableau-ipo-could-validate-the-big-data-visualization-push-or-not/">could be a strong indicator</a> of just how powerful the data movement is, and how well it capitalizes on a new influx of cash will determine how long it stays on the top of customers&#8217; minds.</p>
<p><em>This post was updated at 7:01 p.m. to include previous estimates of the company&#8217;s market capitalization and a link to its S-1 filing.</em></p>
<br />  <img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=gigaom.com&#038;blog=14960843&#038;post=646412&#038;subd=gigaom2&#038;ref=&#038;feed=1" width="1" height="1" /><p><a href="http://pubads.g.doubleclick.net/gampad/jump?iu=/1008864/GigaOM_RSS_300x250&#038;sz=300x250&#038;c=213382"><img src="http://pubads.g.doubleclick.net/gampad/ad?iu=/1008864/GigaOM_RSS_300x250&#038;sz=300x250&#038;c=213382" /></a></p><p><strong>Related research and analysis from GigaOM Pro:</strong><br />Subscriber content. <a href="http://pro.gigaom.com/?utm_source=data&utm_medium=editorial&utm_campaign=auto3&utm_term=646412+tableau-prices-its-stock-at-31-per-share-for-fridays-ipo&utm_content=dharrisstructure">Sign up for a free trial</a>.</p><ul><li><a href="http://pro.gigaom.com/2012/05/the-importance-of-putting-the-u-and-i-in-visualization/?utm_source=data&utm_medium=editorial&utm_campaign=auto3&utm_term=646412+tableau-prices-its-stock-at-31-per-share-for-fridays-ipo&utm_content=dharrisstructure">The importance of putting the U and I in visualization</a></li><li><a href="http://pro.gigaom.com/2012/03/4-ipad-apps-to-help-wrangle-data/?utm_source=data&utm_medium=editorial&utm_campaign=auto3&utm_term=646412+tableau-prices-its-stock-at-31-per-share-for-fridays-ipo&utm_content=dharrisstructure">4 iPad apps to help wrangle data</a></li><li><a href="http://pro.gigaom.com/2012/12/sector-roadmap-health-care-and-big-data-in-2012/?utm_source=data&utm_medium=editorial&utm_campaign=auto3&utm_term=646412+tableau-prices-its-stock-at-31-per-share-for-fridays-ipo&utm_content=dharrisstructure">Health care and big data in 2012</a></li></ul>]]></content:encoded>
			<wfw:commentRss>http://gigaom.com/2013/05/16/tableau-prices-its-stock-at-31-per-share-for-fridays-ipo/feed/</wfw:commentRss>
		<slash:comments>6</slash:comments>
	
		<media:thumbnail url="http://gigaom2.files.wordpress.com/2013/05/products_desktop.jpg?w=150" />
		<media:content url="http://gigaom2.files.wordpress.com/2013/05/products_desktop.jpg?w=150" medium="image">
			<media:title type="html">products_desktop</media:title>
		</media:content>

		<media:content url="http://0.gravatar.com/avatar/9e48ffa0913f65c577727457dd63023f?s=96&#38;d=retro&#38;r=PG" medium="image">
			<media:title type="html">dharrisstructure</media:title>
		</media:content>

		<media:content url="http://gigaom2.files.wordpress.com/2013/05/und-leadership-christian-small.jpg" medium="image">
			<media:title type="html">Christian Chabot</media:title>
		</media:content>
	</item>
		<item>
		<title>This is why big data is the sweet spot for SaaS</title>
		<link>http://gigaom.com/2013/05/14/this-is-why-big-data-is-the-sweet-spot-for-saas/</link>
		<comments>http://gigaom.com/2013/05/14/this-is-why-big-data-is-the-sweet-spot-for-saas/#comments</comments>
		<pubDate>Wed, 15 May 2013 01:10:22 +0000</pubDate>
		<dc:creator>Derrick Harris</dc:creator>
				<category><![CDATA[analytics]]></category>
		<category><![CDATA[big data]]></category>
		<category><![CDATA[BloomReach]]></category>
		<category><![CDATA[Cloud Computing]]></category>
		<category><![CDATA[data science]]></category>
		<category><![CDATA[machine-learning]]></category>
		<category><![CDATA[marketing]]></category>
		<category><![CDATA[natural language processing]]></category>
		<category><![CDATA[saas]]></category>

		<guid isPermaLink="false">http://gigaom.com/?p=645189</guid>
		<description><![CDATA[When it comes to using big data technology effectively, there's a lot to like about SaaS. When companies like BloomReach create and analyze massive web-wide data sets, they automate insights that almost no individual company could discover on its own.<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=gigaom.com&#038;blog=14960843&#038;post=645189&#038;subd=gigaom2&#038;ref=&#038;feed=1" width="1" height="1" />]]></description>
				<content:encoded><![CDATA[<p>People often ask me where the smart money is in big data. I often tell them that’s a foolish question, because I’m not an investor — but if I were, I’d look to software as a service.</p>
<p>There are two primary reasons why, the first of which is obvious: Companies are tired of managing applications and infrastructure, so something that optimizes a common task using techniques they don’t know on servers they don’t have to manage is probably compelling. It’s called cloud computing.</p>
<p>The other reason is that <a href="http://gigaom.com/2013/04/29/google-research-director-and-ai-expert-peter-norvig-elected-into-aaas/">the <em>big </em>part of big data really is important</a> if you want to get a really clear picture of what’s happening in any given space. While no single end-user company can (or likely would) address search-engine optimization, for example, by building a massive store comprised of data from hundreds or thousands of companies as well as the entire web, a cloud service dedicated to that specific task can.</p>
<p>From <a href="http://gigaom.com/2012/11/28/log-data-startup-sumo-logic-raises-30m/">web security</a> to <a href="http://gigaom.com/2012/06/21/how-collective-intelligence-is-reshaping-systems-management/">systems management</a>, we’re already seeing how centralized data stores provide SaaS companies a broad view into what’s happening that can then be filtered down to serve each individual customer’s specific situation. <a href="http://www.bloomreach.com/">BloomReach</a>, a SaaS startup that helps companies optimize web-page content, is another good example of this principle in action.</p>
<h2 id="how-do-you-say-cotton-maxi-dre">How do <em>you</em> say, “cotton maxi dress”</h2>
<p>Ideally, BloomReach Head of Marketing Joelle Kaufman told me, the company wants to help customers ensure they get found in web searches by making sure they’re not invisible (buried deep down), irrelevant (not saying anything meaningful on their sites) or incompatible (not speaking their consumers’ language). On Tuesday, the company <a href="http://www.bloomreach.com/buzz/media-center-pr/continuous-quality-management/">announced a new feature called Continuous Quality Management</a>, which lets customers continuously monitor their pages to ensure they’re still featuring the right products and the right terminology. It’s the latest addition to a seemingly useful service that’s built atop a big data foundation few — if any — of its customers would ever attempt to build themselves.</p>
<p>BloomReach is able to help companies optimize their sites because it’s constantly crawling the web in order to figure out how everyone else is describing their content, laying out their pages and structuring their links. Running on the Amazon Web Services cloud, BloomReach runs more than 1,000 Hadoop jobs a day that process about 5 terabytes of data and a billion data points about users’ site behavior. With the latter, co-founder and CTO Ashutosh Garg explained, the company is trying to figure out who’s visiting sites, what they’re doing, how long they’re spending there and how they’re related in terms of behavior.</p>
<p>“You need to have the right amount of data and from the right places before we can do anything with it,” he said. “… It’s a massive machine learning problem.”</p>
<p><a href="http://gigaom2.files.wordpress.com/2013/05/br-stack.png"><img alt="BR stack" src="http://gigaom2.files.wordpress.com/2013/05/br-stack.png?w=708&#038;h=531" width="708" height="531" class="aligncenter size-large wp-image-645359"></a></p>
<p>When you consider all the possible ways something could be described or formatted, the scale of the problem becomes more evident. Simple semantic analysis like associating “desk” and “table” is easy, Garg explained, but what if some wants a lightweight camera and you only have its exact weight listed without any indication of how it compares to other options? What if people searching for “smartphones” really mean “Android phones,” but you’re top-loading your results with BlackBerry phones and Windows phones?</p>
<p>Another of Garg’s hypotheticals has to do with consumers’ presentation biases. If, for example, they’re looking at a lot of websites that look the same or focus on the same things (e.g., megapixels for digital cameras), they’ll expect to see the same things from every site.</p>
<h2 id="10-nonillion-possibilities-cho">10 nonillion possibilities: Choose 1.</h2>
<p>From a sheer numbers perspective, things get even hairier when you’re trying to determine the relationship between any two pages in order to figure out the best path for links to to take. Garg said this is what computer scientists call an <a href="http://en.wikipedia.org/wiki/NP-complete">NP-complete problem</a>, which means the amount of time it takes to process the results is exponentially greater than the amount of content you’re analyzing. So, for example, analyzing 40 pages doesn’t take 10 times as long as analyzing 4 pages, but more like 100 times longer.</p>
<p>Actually, BloomReach CEO Raj De Datta gave me another example of this problem <a href="http://gigaom.com/2012/02/22/bloomreach-wants-to-save-your-site-with-big-data/">when we spoke in early 2012</a>. Here’s how I described it then:</p>
<blockquote id="quote-if-a-company-wants-t"><p>[I]f a company wants to display just 1,000 products across 100 pages, De Datta explained, there are 10-to-the-28th-power (10 octillion) possibilities for how to do that. When it comes time to describe those products, there are 10-to-the-30th-power (10 nonillion) possibilities.</p></blockquote>
<p>If a website has a million pages, Garg said, “it will take you longer than the life of the universe to solve that problem.”</p>
<p>Where this type of problem arises, BloomReach turns to <a href="http://en.wikipedia.org/wiki/Monte_Carlo_method">Monte Carlo simluations</a>, a favorite technique of physicists and Wall Street quants. The method involves running lots of simulations over large data sets in order to determine approximate results in a reasonable time frame. (And if all this isn’t enough computer science and cloud infrastructure for you, I suggest attending our <a href="http://event.gigaom.com/structure/?utm_source=data&amp;utm_medium=editorial&amp;utm_campaign=intext&amp;utm_term=645189+this-is-why-big-data-is-the-sweet-spot-for-saas&amp;utm_content=dharrisstructure">Structure conference</a> in June, which features a who’s who list of speakers, including Google’s Jeff Dean, Facebook’s Jay Parikh and Netflix’s Adrian Cockroft.)</p>
<h2 id="different-queries-different-pa">Different queries, different pages</h2>
<p>Things get even trickier when you’re trying to change the content of web pages in real time as people are searching for things. This isn’t the best method for organic search, where pages need to stay pretty consistent with the indexed versions, but it can be ideal in situations such as paid search and mobile. There are millions of ways to segment buyers, Garg explained, and how accurately you assess their intent and display your content can make the all the difference. Whether someone is a new or repeat visitor often matters, as does whether someone is price-conscious (e.g., the query included “cheap”) or perhaps searching for a particular brand.</p>
<div id="attachment_645358" class="wp-caption aligncenter" style="width: 718px"><a href="http://gigaom2.files.wordpress.com/2013/05/llbean.png"><img alt="Source: BloomReach" src="http://gigaom2.files.wordpress.com/2013/05/llbean.png?w=708&#038;h=531" width="708" height="531" class="size-large wp-image-645358"></a><p class="wp-caption-text">Source: BloomReach</p></div>
<p>Around the holidays, the company actually realized something interesting: The bounce rate on queries for things like “gifts for dad” or “gifts for co-workers” was pretty high, but so was the conversion rate. The time to conversion was relatively fast, as well. It turns out, Garg explained, that people don’t like to overthink certain gifts too much, so if something is presented in a visually appealing manner and is within their price range, they’ll buy.</p>
<p>But creating these types of models involves more than meets the eye. For all the talk about machine learning — and machines do a majority of the work for BloomReach — people also play a critical role. A person might know better than a machine whether something was likely purchased as gift, Garg explained, or they might spot the offensive content on the T-shirt the machine decided was ideal.</p>
<p>“Humans are really good at creativity, thinking through stuff,” he said.</p>
<p>Smart humans are also good at knowing when they’re overmatched, which is why SaaS is so valuable in the big data era. CMOs could try doing what BloomReach or <a href="http://gigaom.com/2012/04/24/datapop-scores-7m-for-custom-built-ads/">similar companies such as DataPop</a> are doing, or they could pay someone to do it much better. Guess which route the smart ones will take.</p>
<p><em>Feature image courtesy of <a href="http://www.shutterstock.com/gallery-54269p1.html">Shutterstock user Andrea Danti</a>.</em></p>
<br />  <img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=gigaom.com&#038;blog=14960843&#038;post=645189&#038;subd=gigaom2&#038;ref=&#038;feed=1" width="1" height="1" /><p><a href="http://pubads.g.doubleclick.net/gampad/jump?iu=/1008864/GigaOM_RSS_300x250&#038;sz=300x250&#038;c=864617"><img src="http://pubads.g.doubleclick.net/gampad/ad?iu=/1008864/GigaOM_RSS_300x250&#038;sz=300x250&#038;c=864617" /></a></p><p><strong>Related research and analysis from GigaOM Pro:</strong><br />Subscriber content. <a href="http://pro.gigaom.com/?utm_source=data&utm_medium=editorial&utm_campaign=auto3&utm_term=645189+this-is-why-big-data-is-the-sweet-spot-for-saas&utm_content=dharrisstructure">Sign up for a free trial</a>.</p><ul><li><a href="http://pro.gigaom.com/2012/03/a-near-term-outlook-for-big-data/?utm_source=data&utm_medium=editorial&utm_campaign=auto3&utm_term=645189+this-is-why-big-data-is-the-sweet-spot-for-saas&utm_content=dharrisstructure">A near-term outlook for big data</a></li><li><a href="http://pro.gigaom.com/2012/06/cloud-computing-infrastructure-2012-and-beyond/?utm_source=data&utm_medium=editorial&utm_campaign=auto3&utm_term=645189+this-is-why-big-data-is-the-sweet-spot-for-saas&utm_content=dharrisstructure">Cloud computing infrastructure: 2012 and beyond</a></li><li><a href="http://pro.gigaom.com/2012/04/infrastructure-q1-cloud-and-big-data-woo-the-enterprise/?utm_source=data&utm_medium=editorial&utm_campaign=auto3&utm_term=645189+this-is-why-big-data-is-the-sweet-spot-for-saas&utm_content=dharrisstructure">Infrastructure Q1: Cloud and big data woo enterprises</a></li></ul>]]></content:encoded>
			<wfw:commentRss>http://gigaom.com/2013/05/14/this-is-why-big-data-is-the-sweet-spot-for-saas/feed/</wfw:commentRss>
		<slash:comments>0</slash:comments>
	
		<media:thumbnail url="http://gigaom2.files.wordpress.com/2013/05/shutterstock_119782672.jpg?w=150" />
		<media:content url="http://gigaom2.files.wordpress.com/2013/05/shutterstock_119782672.jpg?w=150" medium="image">
			<media:title type="html">collective intelligence</media:title>
		</media:content>

		<media:content url="http://0.gravatar.com/avatar/9e48ffa0913f65c577727457dd63023f?s=96&#38;d=retro&#38;r=PG" medium="image">
			<media:title type="html">dharrisstructure</media:title>
		</media:content>

		<media:content url="http://gigaom2.files.wordpress.com/2013/05/br-stack.png?w=708" medium="image">
			<media:title type="html">BR stack</media:title>
		</media:content>

		<media:content url="http://gigaom2.files.wordpress.com/2013/05/llbean.png?w=708" medium="image">
			<media:title type="html">Source: BloomReach</media:title>
		</media:content>
	</item>
		<item>
		<title>Visualization is the future: 6 startups re-imagining how we consume data</title>
		<link>http://gigaom.com/2013/05/13/visualization-is-the-future-6-startups-re-imagining-how-we-consume-data/</link>
		<comments>http://gigaom.com/2013/05/13/visualization-is-the-future-6-startups-re-imagining-how-we-consume-data/#comments</comments>
		<pubDate>Mon, 13 May 2013 18:20:25 +0000</pubDate>
		<dc:creator>Derrick Harris</dc:creator>
				<category><![CDATA[analytics]]></category>
		<category><![CDATA[Ayasdi]]></category>
		<category><![CDATA[BeyondCore]]></category>
		<category><![CDATA[big data]]></category>
		<category><![CDATA[ClearStory]]></category>
		<category><![CDATA[data]]></category>
		<category><![CDATA[data democratization]]></category>
		<category><![CDATA[Datahero]]></category>
		<category><![CDATA[Platfora]]></category>
		<category><![CDATA[Visualization]]></category>
		<category><![CDATA[Zoomdata]]></category>

		<guid isPermaLink="false">http://gigaom.com/?p=643727</guid>
		<description><![CDATA[If the big data era is really going to revolutionize our world, visualizations that let more people make sense of data will be critical. Here are six startups trying to change how we interact with and look at our data.<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=gigaom.com&#038;blog=14960843&#038;post=643727&#038;subd=gigaom2&#038;ref=&#038;feed=1" width="1" height="1" />]]></description>
				<content:encoded><![CDATA[<p>Although visualization is hardly the most technologically challenging part of the data-analysis puzzle, it’s arguably the most important.</p>
<p>Storage, databases, query processing and algorithms are all extremely important — heck, visualization is next to nothing without them — but in a data-driven world where is obsessed with insights, they’re just the foundational layers. They are to big data what server and network configurations are to mobile-app development on <a href="http://gigaom.com/2013/04/25/facebook-acquires-mobile-development-platform-parse/">platforms like Parse</a>. If you’re going to find out new things from massive and highly complex data sets, or <a href="http://gigaom.com/2013/04/07/we-need-a-data-democracy-not-a-benevolent-data-dictatorship/">going to give new types of people the ability to analyze even simple data</a>, the presentation of that data and the ability to create consumable presentations are critical.</p>
<p>With that in mind, here are six startups I’ve seen trying to fundamentally change the way that data is visualized. Some are highly complex under the covers, some are not and none are perfect, but they’re all doing their part to make us rethink what it means to look at data and make spreadsheets and static charts look like relics. (And this list is by no means exhaustive, so feel free to add your favorite visualization tools in the comments.) We’ll be highlighting data visualization at our design-focused RoadMap conference in San Francisco in November (<a href="http://event.gigaom.com/gigaomroadmap/?utm_source=data&amp;utm_medium=editorial&amp;utm_campaign=intext&amp;utm_term=643727+visualization-is-the-future-6-startups-re-imagining-how-we-consume-data&amp;utm_content=dharrisstructure">sign up here</a> to get first access to tickets this Summer).</p>
<h2 id="ayasdi">Ayasdi</h2>
<p>The idea of network graphs isn’t new, but <a href="http://ayasdi.com/">Ayasdi’s</a> approach to it is. Under the covers, there’s an HBase data store, a technique called <del>topographical</del> topological data analysis and hundreds of machine learning algorithms to churn through complex data sets and determine the similarity among the data points. To the end user, though, <a href="http://gigaom.com/2013/01/16/has-ayasdi-turned-machine-learning-into-a-magic-bullet/">there’s a map of the data set that looks a lot like a network graph</a> (only it’s probably not network data) highlighting clusters of related data points that analysts might want to investigate further.</p>
<p><a href="http://gigaom2.files.wordpress.com/2013/05/tcga.png"><img alt="tcga" src="http://gigaom2.files.wordpress.com/2013/05/tcga.png?w=708"   class="aligncenter size-full wp-image-644682"></a></p>
<h2 id="beyondcore">BeyondCORE</h2>
<p><a href="http://beyondcore.com/">BeyondCore</a> actually operates under the same basic premise as Ayasdi — show users the significant correlations so they don’t have to think of the queries that will uncover them — but it uses some different techniques to get there. It uses a different visualization method, too: BeyondCore sticks to standard charts, but actually offers the option of <a href="http://gigaom.com/2012/11/20/a-startup-asks-what-if-you-didnt-have-to-analyze-data-at-all/">having an avatar talk users through the correlations</a> the software has discovered.</p>
<p><a href="http://gigaom2.files.wordpress.com/2013/05/animatedbriefing.jpg"><img alt="animatedbriefing" src="http://gigaom2.files.wordpress.com/2013/05/animatedbriefing.jpg?w=708"   class="aligncenter size-full wp-image-644685"></a></p>
<h2 id="clearstory">ClearStory</h2>
<p><a href="http://www.clearstorydata.com/">ClearStory</a> has a pretty unique product in the works — even if it’s keeping many details and all of its screenshots under lock and key until its formally launches. Essentially, though, <a href="http://gigaom.com/2012/12/05/clearstory-data-raises-9m-and-might-actually-make-data-your-friend/">it’s trying to tell stories via visualizations</a> that display mashups of numerous data sources, update automatically when the source data changes, and invoke collaboration and social concepts. Here’s Co-founder and CEO Sharmila Mulligan explaining the idea behind ClearStory at Structure: Data in March.</p>
<span class="embed-youtube" style="text-align:center; display: block;"><iframe class="youtube-player" type="text/html" width="604" height="370" src="http://www.youtube.com/embed/O62VVrKD1NE?version=3&amp;rel=1&amp;fs=1&amp;showsearch=0&amp;showinfo=1&amp;iv_load_policy=1&amp;wmode=transparent" frameborder="0"></iframe></span>
<h2 id="datahero">Datahero</h2>
<p>Unlike so many data startups, <a href="http://www.datahero.com/">Datahero</a> isn’t trying to woo people fed up with business-intelligence software or the difficulties of getting insights from Hadoop data. Rather, it’s <a href="http://gigaom.com/2013/04/23/visualization-startup-datahero-opens-its-doors-and-delivers-data-analysis-for-the-masses/">trying to let people with simple business or personal data make simple charts</a> without ever having to enter an Excel function or worry too much about how their spreadsheets are formatted. Early on, Datahero’s visualizations are still pretty commonplace (bars, pies, plots, etc.), but it’s the ease of creating them that’s so unique.</p>
<p><a href="http://gigaom2.files.wordpress.com/2013/05/dh-10-e1366704037117.jpg"><img alt="dh-10-e1366704037117" src="http://gigaom2.files.wordpress.com/2013/05/dh-10-e1366704037117.jpg?w=708&#038;h=402" width="708" height="402" class="aligncenter size-full wp-image-644697"></a></p>
<h2 id="platfora">Platfora</h2>
<p><a href="http://platfora.com/">Platfora</a> has undertaken the ambitious task of trying to make analyzing mountains of data stored in Hadoop clusters as easy as analyzing their own <a href="https://stripe.com/">Stripe</a> data might be for developers using Datahero. It’s <a href="http://gigaom.com/2012/10/23/platfora-shows-a-whole-new-way-to-do-business-intelligence-on-big-data/">based on a foundation of Hadoop and massively parallel query processing</a>, but is presented like an HTML5 version of <a href="http://gigaom.com/2013/04/03/a-tableau-ipo-could-validate-the-big-data-visualization-push-or-not/">current visualization golden boy Tableau</a> that’s all about dragging, dropping, and visually slicing and dicing through data. The latter capability is actually critical in a big data world where there are likely more data points than you can ever digest at once.</p>
<p><a href="http://gigaom2.files.wordpress.com/2013/05/explore_slide_4.jpg"><img alt="explore_slide_4" src="http://gigaom2.files.wordpress.com/2013/05/explore_slide_4.jpg?w=708&#038;h=375" width="708" height="375" class="aligncenter size-large wp-image-644705"></a></p>
<h2 id="zoomdata">Zoomdata</h2>
<p><a href="http://www.zoomdata.com/">Zoomdata</a> is far from the only analytics company to support mobile devices, but it’s one of the few I know of (<a href="http://www.roambi.com/analytics-overview.html">Roambi</a> also comes to mind) designed primarily for them. Zoomdata connects to standard business data sources, but takes advantage of touch screens and the D3.js visualization project to offer up some visually interesting charts that are <a href="http://gigaom.com/2012/11/13/heres-how-it-looks-when-big-data-goes-mobile-first/">designed to be manipulated like an artist’s palette</a>.</p>
<p><a href="http://gigaom2.files.wordpress.com/2013/05/ticketstatus_101812.jpg"><img alt="ticketstatus_101812" src="http://gigaom2.files.wordpress.com/2013/05/ticketstatus_101812.jpg?w=708&#038;h=531" width="708" height="531" class="aligncenter size-full wp-image-644709"></a></p>
<br />  <img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=gigaom.com&#038;blog=14960843&#038;post=643727&#038;subd=gigaom2&#038;ref=&#038;feed=1" width="1" height="1" /><p><a href="http://pubads.g.doubleclick.net/gampad/jump?iu=/1008864/GigaOM_RSS_300x250&#038;sz=300x250&#038;c=78720"><img src="http://pubads.g.doubleclick.net/gampad/ad?iu=/1008864/GigaOM_RSS_300x250&#038;sz=300x250&#038;c=78720" /></a></p><p><strong>Related research and analysis from GigaOM Pro:</strong><br />Subscriber content. <a href="http://pro.gigaom.com/?utm_source=data&utm_medium=editorial&utm_campaign=auto3&utm_term=643727+visualization-is-the-future-6-startups-re-imagining-how-we-consume-data&utm_content=dharrisstructure">Sign up for a free trial</a>.</p><ul><li><a href="http://pro.gigaom.com/2012/05/the-importance-of-putting-the-u-and-i-in-visualization/?utm_source=data&utm_medium=editorial&utm_campaign=auto3&utm_term=643727+visualization-is-the-future-6-startups-re-imagining-how-we-consume-data&utm_content=dharrisstructure">The importance of putting the U and I in visualization</a></li><li><a href="http://pro.gigaom.com/2012/07/cloud-computing-and-trickle-down-analytics/?utm_source=data&utm_medium=editorial&utm_campaign=auto3&utm_term=643727+visualization-is-the-future-6-startups-re-imagining-how-we-consume-data&utm_content=dharrisstructure">Cloud computing and trickle-down analytics</a></li><li><a href="http://pro.gigaom.com/2012/03/a-near-term-outlook-for-big-data/?utm_source=data&utm_medium=editorial&utm_campaign=auto3&utm_term=643727+visualization-is-the-future-6-startups-re-imagining-how-we-consume-data&utm_content=dharrisstructure">A near-term outlook for big data</a></li></ul>]]></content:encoded>
			<wfw:commentRss>http://gigaom.com/2013/05/13/visualization-is-the-future-6-startups-re-imagining-how-we-consume-data/feed/</wfw:commentRss>
		<slash:comments>5</slash:comments>
	
		<media:thumbnail url="http://gigaom2.files.wordpress.com/2013/05/tcga.png?w=150" />
		<media:content url="http://gigaom2.files.wordpress.com/2013/05/tcga.png?w=150" medium="image">
			<media:title type="html">tcga</media:title>
		</media:content>

		<media:content url="http://0.gravatar.com/avatar/9e48ffa0913f65c577727457dd63023f?s=96&#38;d=retro&#38;r=PG" medium="image">
			<media:title type="html">dharrisstructure</media:title>
		</media:content>

		<media:content url="http://gigaom2.files.wordpress.com/2013/05/tcga.png" medium="image">
			<media:title type="html">tcga</media:title>
		</media:content>

		<media:content url="http://gigaom2.files.wordpress.com/2013/05/animatedbriefing.jpg" medium="image">
			<media:title type="html">animatedbriefing</media:title>
		</media:content>

		<media:content url="http://gigaom2.files.wordpress.com/2013/05/dh-10-e1366704037117.jpg" medium="image">
			<media:title type="html">dh-10-e1366704037117</media:title>
		</media:content>

		<media:content url="http://gigaom2.files.wordpress.com/2013/05/explore_slide_4.jpg?w=708" medium="image">
			<media:title type="html">explore_slide_4</media:title>
		</media:content>

		<media:content url="http://gigaom2.files.wordpress.com/2013/05/ticketstatus_101812.jpg" medium="image">
			<media:title type="html">ticketstatus_101812</media:title>
		</media:content>
	</item>
		<item>
		<title>SAP renames Visual Intelligence &#8220;Lumira&#8221; and sticks it in the cloud</title>
		<link>http://gigaom.com/2013/05/13/sap-renames-visual-intelligence-lumira-and-sticks-it-in-the-cloud/</link>
		<comments>http://gigaom.com/2013/05/13/sap-renames-visual-intelligence-lumira-and-sticks-it-in-the-cloud/#comments</comments>
		<pubDate>Mon, 13 May 2013 10:53:10 +0000</pubDate>
		<dc:creator>David Meyer</dc:creator>
				<category><![CDATA[analytics]]></category>
		<category><![CDATA[BI]]></category>
		<category><![CDATA[Business Intelligence]]></category>
		<category><![CDATA[BusinessObjects]]></category>
		<category><![CDATA[data visualization]]></category>
		<category><![CDATA[Dropbox]]></category>
		<category><![CDATA[SAP]]></category>
		<category><![CDATA[SAP HANA]]></category>

		<guid isPermaLink="false">http://gigaom.com/?p=644497</guid>
		<description><![CDATA[The software giant's "project Photon" seems to be materializing in the form of Lumira, which promises self-service data visualization in the cloud. It remains to be seen how this can co-exist with SAP's BI OnDemand, though.<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=gigaom.com&#038;blog=14960843&#038;post=644497&#038;subd=gigaom2&#038;ref=&#038;feed=1" width="1" height="1" />]]></description>
				<content:encoded><![CDATA[<p>SAP really is <a href="http://gigaom.com/2013/05/07/sap-to-world-were-a-cloud-company-no-really/">pushing hard on this cloud thing</a>. Days after the German business software giant announced plans to put its HANA in-memory database into the cloud, it has done the same with its Visual Intelligence product, now renamed &#8220;Lumira&#8221; (SAP dearly loves renaming its products, and this time it&#8217;s gone for <a href="http://scn.sap.com/community/visual-intelligence/blog/2013/05/10/sap-lumira-why-did-we-change-yet-another-perfectly-good-bi-product-name">&#8220;a more human-friendly yet Google-ready name&#8221;</a>).</p>
<p><a href="http://www54.sap.com/pc/analytics/business-intelligence/software/data-visualization/cloud.html">Lumira Cloud</a> supposedly gives SAP an answer to the <a href="http://gigaom.com/2013/04/07/we-need-a-data-democracy-not-a-benevolent-data-dictatorship/">recent explosion</a> in the cloud-based, self-service data visualization offerings. The HTML5-built BI service comes with a &#8220;monthly&#8221; subscription fee (albeit one that can only be ordered in annual chunks) and lets its users publish and share data visualizations with one another for viewing or editing on desktop or mobile devices.</p>
<p>SAP Lumira Cloud appears to be more an Dropbox-ish add-on for the desktop version of Lumira than a cloud-based replacement, but it does also allow the creation of datasets from Excel documents. The service, which integrates with on-premise data and naturally supports HANA, can also be used to share SAP BusinessObjects Design Studio files and SAP Crystal Reports documents.</p>
<p>This release appears to be the culmination of what SAP has been previously <a href="http://scn.sap.com/community/business-intelligence/blog/2013/04/08/cloud-analytics-is-all-smoke-and-no-fire">referring to as &#8220;project Photon&#8221;</a> – supposedly the company&#8217;s &#8220;true departmental self-service BI offering.&#8221; The issue here, of course, is the monumental and somewhat confusing nature of the company&#8217;s portfolio. After all, doesn&#8217;t SAP already do this SME-courting, departmental analytics stuff through its BusinessObjects BI OnDemand product?</p>
<p>Try visiting <a href="www.sap.com/solutions/sapbusinessobjects/ondemand/‎">at least one</a> of the BI OnDemand product pages and you&#8217;ll be taken through to the Lumira page. Look at the <a href="http://scn.sap.com/docs/DOC-41354">Lumira Cloud FAQs</a> and you&#8217;ll be told that BI OnDemand will continue to run &#8220;in parallel&#8221; to Lumira Cloud, but also that OnDemand customers can contact their account representative &#8220;to discuss the best timing and strategy&#8221; for migrating to the new service.</p>
<p>Perhaps this less-than-clear situation presages a simplification of SAP&#8217;s portfolio – no doubt more will be revealed at the company&#8217;s SAPPHIRE NOW conference this week. If it doesn&#8217;t, customers in search of next-generation data visualization tools have <a href="http://gigaom.com/2013/04/07/we-need-a-data-democracy-not-a-benevolent-data-dictatorship/">many far more straightforward options</a> to check out.</p>
<br />  <img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=gigaom.com&#038;blog=14960843&#038;post=644497&#038;subd=gigaom2&#038;ref=&#038;feed=1" width="1" height="1" /><p><a href="http://pubads.g.doubleclick.net/gampad/jump?iu=/1008864/GigaOM_RSS_300x250&#038;sz=300x250&#038;c=203684"><img src="http://pubads.g.doubleclick.net/gampad/ad?iu=/1008864/GigaOM_RSS_300x250&#038;sz=300x250&#038;c=203684" /></a></p><p><strong>Related research and analysis from GigaOM Pro:</strong><br />Subscriber content. <a href="http://pro.gigaom.com/?utm_source=data&utm_medium=editorial&utm_campaign=auto3&utm_term=644497+sap-renames-visual-intelligence-lumira-and-sticks-it-in-the-cloud&utm_content=superglaze">Sign up for a free trial</a>.</p><ul><li><a href="http://pro.gigaom.com/2012/12/big-data-2013-key-trends-and-companies-to-watch/?utm_source=data&utm_medium=editorial&utm_campaign=auto3&utm_term=644497+sap-renames-visual-intelligence-lumira-and-sticks-it-in-the-cloud&utm_content=superglaze">Big data 2013: key trends and companies to watch</a></li><li><a href="http://pro.gigaom.com/2012/04/sector-roadmap-hadoop-platforms-2012/?utm_source=data&utm_medium=editorial&utm_campaign=auto3&utm_term=644497+sap-renames-visual-intelligence-lumira-and-sticks-it-in-the-cloud&utm_content=superglaze">2012: The Hadoop infrastructure market booms</a></li><li><a href="http://pro.gigaom.com/2012/04/infrastructure-q1-cloud-and-big-data-woo-the-enterprise/?utm_source=data&utm_medium=editorial&utm_campaign=auto3&utm_term=644497+sap-renames-visual-intelligence-lumira-and-sticks-it-in-the-cloud&utm_content=superglaze">Infrastructure Q1: Cloud and big data woo enterprises</a></li></ul>]]></content:encoded>
			<wfw:commentRss>http://gigaom.com/2013/05/13/sap-renames-visual-intelligence-lumira-and-sticks-it-in-the-cloud/feed/</wfw:commentRss>
		<slash:comments>0</slash:comments>
	
		<media:thumbnail url="http://gigaom2.files.wordpress.com/2013/05/sap-lumira.jpg?w=150" />
		<media:content url="http://gigaom2.files.wordpress.com/2013/05/sap-lumira.jpg?w=150" medium="image">
			<media:title type="html">SAP Lumira</media:title>
		</media:content>

		<media:content url="http://0.gravatar.com/avatar/6599daccfd7e897e68744fe0065e5a2e?s=96&#38;d=retro&#38;r=PG" medium="image">
			<media:title type="html">superglaze</media:title>
		</media:content>
	</item>
		<item>
		<title>How data warehousing is now a cost-effective solution for businesses</title>
		<link>http://pro.gigaom.com/report/the-new-economics-of-enterprise-data-warehousing/</link>
		<comments>http://pro.gigaom.com/report/the-new-economics-of-enterprise-data-warehousing/#comments</comments>
		<pubDate>Mon, 13 May 2013 06:55:34 +0000</pubDate>
		<dc:creator>nraden</dc:creator>
				<category><![CDATA[Uncategorized]]></category>
		<category><![CDATA[ADAPA]]></category>
		<category><![CDATA[analytics]]></category>
		<category><![CDATA[apache-hadoop]]></category>
		<category><![CDATA[big data]]></category>
		<category><![CDATA[Business Intelligence]]></category>
		<category><![CDATA[clickstream analytics]]></category>
		<category><![CDATA[Cloud Computing]]></category>
		<category><![CDATA[cloud-infrastructure]]></category>
		<category><![CDATA[columnar databases]]></category>
		<category><![CDATA[data]]></category>
		<category><![CDATA[data analysis]]></category>
		<category><![CDATA[data management]]></category>
		<category><![CDATA[data storage]]></category>
		<category><![CDATA[data warehouse]]></category>
		<category><![CDATA[data warehousing]]></category>
		<category><![CDATA[data-analytics]]></category>
		<category><![CDATA[database]]></category>
		<category><![CDATA[database technology]]></category>
		<category><![CDATA[Database theory]]></category>
		<category><![CDATA[distributed processing]]></category>
		<category><![CDATA[EMC]]></category>
		<category><![CDATA[etl]]></category>
		<category><![CDATA[extraction transform load systems]]></category>
		<category><![CDATA[Ferrari]]></category>
		<category><![CDATA[file systems]]></category>
		<category><![CDATA[Greenplum]]></category>
		<category><![CDATA[Hadoop]]></category>
		<category><![CDATA[HDFS]]></category>
		<category><![CDATA[Hewlett-Packard]]></category>
		<category><![CDATA[high-speed technologies]]></category>
		<category><![CDATA[HP]]></category>
		<category><![CDATA[IBM]]></category>
		<category><![CDATA[information technology]]></category>
		<category><![CDATA[integrated circuit]]></category>
		<category><![CDATA[Linux]]></category>
		<category><![CDATA[Mapr]]></category>
		<category><![CDATA[mobile devices]]></category>
		<category><![CDATA[Moore's Law]]></category>
		<category><![CDATA[Netezza]]></category>
		<category><![CDATA[Open Source Software]]></category>
		<category><![CDATA[parallel processing]]></category>
		<category><![CDATA[relational-databases]]></category>
		<category><![CDATA[scalability]]></category>
		<category><![CDATA[social networks]]></category>
		<category><![CDATA[storage devices]]></category>
		<category><![CDATA[storage virtualization technologies]]></category>
		<category><![CDATA[System administration]]></category>
		<category><![CDATA[tco]]></category>
		<category><![CDATA[total-cost-of-ownership]]></category>
		<category><![CDATA[Transaction processing]]></category>
		<category><![CDATA[Truviso]]></category>
		<category><![CDATA[Vertica]]></category>
		<category><![CDATA[Virtualization technology]]></category>

		<guid isPermaLink="false">http://pro.gigaom.com/?post_type=go-report&#038;p=175747/</guid>
		<description><![CDATA[Data-warehouse providers are quickly adding Hadoop distributions, or even their own versions of Hadoop, into their architecture, adding further cost advantages to collections of extremely large data sets. Finding the talent to manage this newly converged environment will not be easy, but it presents tremendous opportunity for companies willing to take some risk.<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=gigaom.com&#038;blog=14960843&#038;post=648494&#038;subd=gigaom2&#038;ref=&#038;feed=1" width="1" height="1" />]]></description>
				<content:encoded><![CDATA[<p>The new economics of data warehousing provide attractive alternatives in both costs and benefits. While big data gets most of the attention, evolved data warehousing will play an important role for the foreseeable future. In order to be relevant, data-warehouse design and operation need to be simplified, taking advantage of greatly improved hardware, software, and methods.</p>
<br />  <img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=gigaom.com&#038;blog=14960843&#038;post=648494&#038;subd=gigaom2&#038;ref=&#038;feed=1" width="1" height="1" /><p><a href="http://pubads.g.doubleclick.net/gampad/jump?iu=/1008864/GigaOM_RSS_300x250&#038;sz=300x250&#038;c=969507"><img src="http://pubads.g.doubleclick.net/gampad/ad?iu=/1008864/GigaOM_RSS_300x250&#038;sz=300x250&#038;c=969507" /></a></p><p><strong>Related research and analysis from GigaOM Pro:</strong><br />Subscriber content. <a href="http://pro.gigaom.com/?utm_medium=editorial&utm_campaign=auto3&utm_term=648494+the-new-economics-of-enterprise-data-warehousing&utm_content=nraden">Sign up for a free trial</a>.</p><ul><li><a href="http://pro.gigaom.com/2012/04/infrastructure-q1-cloud-and-big-data-woo-the-enterprise/?utm_medium=editorial&utm_campaign=auto3&utm_term=648494+the-new-economics-of-enterprise-data-warehousing&utm_content=nraden">Infrastructure Q1: Cloud and big data woo enterprises</a></li><li><a href="http://pro.gigaom.com/2012/07/cloud-and-data-second-quarter-2012-analysis-and-outlook-2/?utm_medium=editorial&utm_campaign=auto3&utm_term=648494+the-new-economics-of-enterprise-data-warehousing&utm_content=nraden">Takeaways from the second quarter in cloud and data</a></li><li><a href="http://pro.gigaom.com/2011/04/infrastructure-q1-iaas-comes-down-to-earth-big-data-takes-flight/?utm_medium=editorial&utm_campaign=auto3&utm_term=648494+the-new-economics-of-enterprise-data-warehousing&utm_content=nraden">Infrastructure Q1: IaaS Comes Down to Earth; Big Data Takes Flight</a></li></ul>]]></content:encoded>
			<wfw:commentRss>http://pro.gigaom.com/report/the-new-economics-of-enterprise-data-warehousing/feed/</wfw:commentRss>
		<slash:comments>0</slash:comments>
	
		<media:thumbnail url="https://gigaom-pro-files.s3.amazonaws.com/files/2012/08/datacenter1.jpg?w=150" />
		<media:content url="https://gigaom-pro-files.s3.amazonaws.com/files/2012/08/datacenter1.jpg?w=150" medium="image">
			<media:title type="html">datacenter1</media:title>
		</media:content>

		<media:content url="http://0.gravatar.com/avatar/fdbbd80432b14e9d84aa12c6fc0cce24?s=96&#38;d=retro&#38;r=PG" medium="image">
			<media:title type="html">nraden</media:title>
		</media:content>
	</item>
		<item>
		<title>ScraperWiki lets anyone scrape Twitter data without coding</title>
		<link>http://gigaom.com/2013/05/10/scraperwiki-lets-anyone-scrape-twitter-data-without-coding/</link>
		<comments>http://gigaom.com/2013/05/10/scraperwiki-lets-anyone-scrape-twitter-data-without-coding/#comments</comments>
		<pubDate>Fri, 10 May 2013 21:38:00 +0000</pubDate>
		<dc:creator>Derrick Harris</dc:creator>
				<category><![CDATA[analytics]]></category>
		<category><![CDATA[data]]></category>
		<category><![CDATA[data democratization]]></category>
		<category><![CDATA[Many Eyes]]></category>
		<category><![CDATA[ScraperWiki]]></category>
		<category><![CDATA[sentiment analysis]]></category>
		<category><![CDATA[text analysis]]></category>
		<category><![CDATA[Twitter data]]></category>
		<category><![CDATA[Visualization]]></category>
		<category><![CDATA[web scraping]]></category>

		<guid isPermaLink="false">http://gigaom.com/?p=644137</guid>
		<description><![CDATA[A new beta version of ScraperWiki makes it easy to relatively easy to scrape Twitter for certain phrases and get to work analyzing the data. It's just one more way that data analysis is getting democratized.<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=gigaom.com&#038;blog=14960843&#038;post=644137&#038;subd=gigaom2&#038;ref=&#038;feed=1" width="1" height="1" />]]></description>
				<content:encoded><![CDATA[<p>The Obama administration&#8217;s <a href="http://gigaom.com/2013/05/09/the-white-house-opens-the-data-floodgates-and-now-the-real-work-will-begin/">open data mandate</a> announced on Thursday was made all the better by the <a href="http://blog.scraperwiki.com/2013/05/10/free-community-accounts/">unveiling of the new ScraperWiki service </a>on Friday. If you&#8217;re not familiar with <a href="https://scraperwiki.com/">ScraperWiki</a>, it&#8217;s a web-scraping service that has been around for a while but has primarily focused on users with some coding chops or data journalists willing to pay to have someone scrape data sets for them. Its new service, though, currently in beta, also makes it possible for anyone to scrape Twitter to create a custom data set without having to write a single line of code.</p>
<p>Taken alone, ScraperWiki isn&#8217;t that big of a deal, but it&#8217;s part of a huge revolution that has been <a href="http://gigaom.com/2013/04/07/we-need-a-data-democracy-not-a-benevolent-data-dictatorship/">called the democratization of data</a>. More data is becoming available all the time &#8212; whether from the government, corportations or even our own lives &#8212; only it&#8217;s not of much use unless you&#8217;re able to do something with it. ScraperWiki is now one of a growing list of tools dedicated to helping everyone, not just expert data analysts or coders, analyze &#8212; and, in its case, generate &#8212; the data that matters to them.</p>
<p>After noticing a particularly large numbers of tweets in my stream about flight delays yesterday, I thought I&#8217;d test out ScraperWiki&#8217;s new Twitter search function by gathering a bunch of tweets directed to @United. The results &#8212; from 1,697 tweets dating back to May 3 &#8212; are pretty fun to play with, if not that surprising. (Also, I have no idea how far back the tweet search will go or how long it will take using the free account, which is limited to 30 minutes of compute time a day. I just stopped at some point so I could start digging in.)</p>
<p>First things first, I ran my query. Here&#8217;s what the data looks like viewed in a table in the ScraperWiki app.</p>
<p><a href="http://gigaom2.files.wordpress.com/2013/05/sw1.jpg"><img  alt="sw1" src="http://gigaom2.files.wordpress.com/2013/05/sw1-e1368211547401.jpg?w=708&#038;h=350" width="708" height="350" class="aligncenter size-large wp-image-644242" /></a></p>
<p>Next, it&#8217;s a matter of analyzing it. ScraperWiki lets you view it in a table (like above), export it to Excel or query it using SQL, and will also summarize it for you. This being Twitter data, the natural thing to do seemed to be analyzing it for sentiment. One simple way to do this right inside the ScraperWiki table is to search for a particular term that might suggest joy or anger. I chose a certain four-letter word that begins with <em>f.</em></p>
<p>Surprisingly, I only found eight instances. Here&#8217;s my favorite: &#8220;Your Customer Service is better than a hooker. I paid a bunch of money and you&#8217;re still&#8230;&#8221; (You probably get the idea.)</p>
<p>But if you read <a href="http://gigaom.com/2013/01/31/data-for-dummies-5-data-analysis-tools-anyone-can-use/">my &#8220;data for dummies&#8221; post</a> from January, you know that we mere mortals have tools at our disposal for dealing with text data in a more refined way. IBM&#8217;s Many Eyes service won&#8217;t let me score tweets for sentiment, but I can get a pretty good idea overall by looking at how words are used. For this job, though, a simple word cloud won&#8217;t work, even after filtering out common words, @united and other obvious terms. Think of how &#8220;thanks&#8221; can be used sarcastically and you can see why.</p>
<p>Using the customized word tree, you can see that &#8220;thanks&#8221; sometimes means &#8220;thanks.&#8221; Other times, not so much. I know it&#8217;s easy to dwell on the negative, but consider this: &#8220;worst&#8221; had 28 hits while &#8220;best&#8221; had 15. One of those was referring to Tito&#8217;s vodka and at least three were referring to skyline views. (<a href="http://www-958.ibm.com/software/analytics/manyeyes/visualizations/thanks">Click here to access it</a> and search by whatever word you want.)</p>
<p><a href="http://gigaom2.files.wordpress.com/2013/05/sw2.jpg"><img  alt="sw2" src="http://gigaom2.files.wordpress.com/2013/05/sw2.jpg?w=708&#038;h=399" width="708" height="399" class="aligncenter size-large wp-image-644258" /></a></p>
<p><a href="http://www-958.ibm.com/software/analytics/manyeyes/visualizations/for-2">Here&#8217;s a phrase net</a> filtering the results by phrases where the word &#8220;for&#8221; connects two words.</p>
<p><a href="http://gigaom2.files.wordpress.com/2013/05/sw3.jpg"><img  alt="sw3" src="http://gigaom2.files.wordpress.com/2013/05/sw3.jpg?w=708&#038;h=337" width="708" height="337" class="aligncenter size-large wp-image-644267" /></a></p>
<p>Anyhow, this was just a fast, simple and fairly crude example of what ScraperWiki now allows users to do, and how that resulting data can be combined with other tools to analyze and visualize it. Obviously, it&#8217;s more powerful if you can code, but new tools are supposedly on the way (remember, this is just a beta version) that should make it easier to scrape data from even more sources.</p>
<p>In the long term, though, services like ScraperWiki should become a lot more valuable as tools for helping us generate and analyze data rather than just believe what we&#8217;re told. Want to improve your small business, put your life in context or perhaps just write the best book report your teacher has ever seen? It&#8217;s getting easier every day.</p>
<br />  <img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=gigaom.com&#038;blog=14960843&#038;post=644137&#038;subd=gigaom2&#038;ref=&#038;feed=1" width="1" height="1" /><p><a href="http://pubads.g.doubleclick.net/gampad/jump?iu=/1008864/GigaOM_RSS_300x250&#038;sz=300x250&#038;c=258150"><img src="http://pubads.g.doubleclick.net/gampad/ad?iu=/1008864/GigaOM_RSS_300x250&#038;sz=300x250&#038;c=258150" /></a></p><p><strong>Related research and analysis from GigaOM Pro:</strong><br />Subscriber content. <a href="http://pro.gigaom.com/?utm_source=data&utm_medium=editorial&utm_campaign=auto3&utm_term=644137+scraperwiki-lets-anyone-scrape-twitter-data-without-coding&utm_content=dharrisstructure">Sign up for a free trial</a>.</p><ul><li><a href="http://pro.gigaom.com/2012/04/aws-storage-gateway-jolts-cloud-storage-ecosystem/?utm_source=data&utm_medium=editorial&utm_campaign=auto3&utm_term=644137+scraperwiki-lets-anyone-scrape-twitter-data-without-coding&utm_content=dharrisstructure">AWS Storage Gateway jolts cloud-storage ecosystem</a></li><li><a href="http://pro.gigaom.com/2012/03/4-ipad-apps-to-help-wrangle-data/?utm_source=data&utm_medium=editorial&utm_campaign=auto3&utm_term=644137+scraperwiki-lets-anyone-scrape-twitter-data-without-coding&utm_content=dharrisstructure">4 iPad apps to help wrangle data</a></li><li><a href="http://pro.gigaom.com/2010/10/will-hadoop-vendors-profit-from-banks-big-data-woes/?utm_source=data&utm_medium=editorial&utm_campaign=auto3&utm_term=644137+scraperwiki-lets-anyone-scrape-twitter-data-without-coding&utm_content=dharrisstructure">Will Hadoop Vendors Profit from Banks&#8217; Big Data Woes?</a></li></ul>]]></content:encoded>
			<wfw:commentRss>http://gigaom.com/2013/05/10/scraperwiki-lets-anyone-scrape-twitter-data-without-coding/feed/</wfw:commentRss>
		<slash:comments>3</slash:comments>
	
		<media:thumbnail url="http://gigaom2.files.wordpress.com/2013/05/tweetsearch.jpg?w=150" />
		<media:content url="http://gigaom2.files.wordpress.com/2013/05/tweetsearch.jpg?w=150" medium="image">
			<media:title type="html">tweetsearch</media:title>
		</media:content>

		<media:content url="http://0.gravatar.com/avatar/9e48ffa0913f65c577727457dd63023f?s=96&#38;d=retro&#38;r=PG" medium="image">
			<media:title type="html">dharrisstructure</media:title>
		</media:content>

		<media:content url="http://gigaom2.files.wordpress.com/2013/05/sw1-e1368211547401.jpg?w=708" medium="image">
			<media:title type="html">sw1</media:title>
		</media:content>

		<media:content url="http://gigaom2.files.wordpress.com/2013/05/sw2.jpg?w=708" medium="image">
			<media:title type="html">sw2</media:title>
		</media:content>

		<media:content url="http://gigaom2.files.wordpress.com/2013/05/sw3.jpg?w=708" medium="image">
			<media:title type="html">sw3</media:title>
		</media:content>
	</item>
		<item>
		<title>Teradata gets into the in-memory biz to take on SAP&#8217;s HANA</title>
		<link>http://gigaom.com/2013/05/08/teradata-gets-into-the-in-memory-biz-to-take-on-saps-hana/</link>
		<comments>http://gigaom.com/2013/05/08/teradata-gets-into-the-in-memory-biz-to-take-on-saps-hana/#comments</comments>
		<pubDate>Wed, 08 May 2013 14:07:43 +0000</pubDate>
		<dc:creator>Derrick Harris</dc:creator>
				<category><![CDATA[analytics]]></category>
		<category><![CDATA[big data]]></category>
		<category><![CDATA[data warehouse]]></category>
		<category><![CDATA[database]]></category>
		<category><![CDATA[in-memory database]]></category>
		<category><![CDATA[Teradata]]></category>

		<guid isPermaLink="false">http://gigaom.com/?p=643284</guid>
		<description><![CDATA[Teradata is trying to steal some thunder in the in-memory analytics space with a new technology called Intelligent Memory that places hot data in RAM while dispersing the rest across solid-state drives and disk.<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=gigaom.com&#038;blog=14960843&#038;post=643284&#038;subd=gigaom2&#038;ref=&#038;feed=1" width="1" height="1" />]]></description>
				<content:encoded><![CDATA[<p>Data analytics veteran Teradata will not let the new era of data-analysis architectures pass it by without a fight. It has already built products to address massive data volumes and Hadoop, and on Wednesday it announced an in-memory database technology to answer the industry’s latest call.</p>
<p>Speed is the driving factory behind the in-memory analytics push that spans everyone from classic Teradata <a href="http://gigaom.com/2013/01/11/sap-marries-transaction-processing-with-analytics-by-putting-business-suite-on-hana/">rivals like SAP</a> and Oracle to startups <a href="http://gigaom.com/2013/01/18/can-a-new-database-help-get-zynga-back-on-track/">such as MemSQL</a>. Estimates vary as to the exact speed difference between data access in RAM versus hard disk, but Teradata is claiming RAM is 3,000 times faster. The speed difference between RAM and solid-state drives or flash memory is smaller, although still significant.</p>
<p>Of course, cost also comes into play, as the speed and cost tend to go hand in hand when it comes to storage media. That’s one reason Teradata says its new technology, called Intelligent Memory, doesn’t operate fully in-memory like some competitive offerings do. Rather, it places only the “hottest” data in memory for super-fast analysis and spreads the rest between solid-state drives and disk within a Teradata environment.</p>
<p><a href="http://gigaom2.files.wordpress.com/2013/05/tdc2.jpg"><img alt="tdc2" src="http://gigaom2.files.wordpress.com/2013/05/tdc2.jpg?w=708"   class="aligncenter size-full wp-image-643317"></a></p>
<p>This concept of intelligent data placement has been around a while in the storage space (it’s part of <a href="http://gigaom.com/2013/05/06/emc-plots-software-defined-data-center-journey-from-vipr-storage-virtualization-base/">EMC’s new ViPR software-defined storage platform</a>, too), but the advent of big data and abundant flash has given it some new life. Many companies <a href="http://gigaom.com/2012/09/10/nimble-storage-gets-40m-as-ipo-approaches/">desire a tiered system</a> in which they can pay more for fast access to their important or hot data, while saving some cash on lower-performance for their older and less-accessed data. Facebook is <a href="http://gigaom.com/2013/01/16/why-facebook-might-put-blu-ray-to-use-on-big-data/">really pushing the envelope here</a> with its cold storage initiative — something VP of Engineering Jay Parikh will likely discuss at our <a href="http://event.gigaom.com/structure/?utm_source=data&amp;utm_medium=editorial&amp;utm_campaign=intext&amp;utm_term=643284+teradata-gets-into-the-in-memory-biz-to-take-on-saps-hana&amp;utm_content=dharrisstructure">Structure conference</a> June 19 and 20 in San Francisco.</p>
<p>In analytics, though, RAM, not flash, is the fastest medium out there. Whether someone goes all-RAM or a tiered approach like Teradata pushing probably depends on how much performance they need across how much data, as well as how much they’re willing to pay. But if you’re doing interactive analytics in the next decade, they’re almost certain to be in-memory to some degree.</p>
<p><em>Feature image courtesy of <a href="http://www.shutterstock.com/gallery-537709p1.html">Shutterstock user Hellen Sergeyeva</a>.</em></p>
<br />  <img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=gigaom.com&#038;blog=14960843&#038;post=643284&#038;subd=gigaom2&#038;ref=&#038;feed=1" width="1" height="1" /><p><a href="http://pubads.g.doubleclick.net/gampad/jump?iu=/1008864/GigaOM_RSS_300x250&#038;sz=300x250&#038;c=73240"><img src="http://pubads.g.doubleclick.net/gampad/ad?iu=/1008864/GigaOM_RSS_300x250&#038;sz=300x250&#038;c=73240" /></a></p><p><strong>Related research and analysis from GigaOM Pro:</strong><br />Subscriber content. <a href="http://pro.gigaom.com/?utm_source=data&utm_medium=editorial&utm_campaign=auto3&utm_term=643284+teradata-gets-into-the-in-memory-biz-to-take-on-saps-hana&utm_content=dharrisstructure">Sign up for a free trial</a>.</p><ul><li><a href="http://pro.gigaom.com/2010/09/the-red-hot-data-warehouse-market-whos-buying-next/?utm_source=data&utm_medium=editorial&utm_campaign=auto3&utm_term=643284+teradata-gets-into-the-in-memory-biz-to-take-on-saps-hana&utm_content=dharrisstructure">The Red-Hot Data Warehouse Market: Who&#8217;s Buying Next?</a></li><li><a href="http://pro.gigaom.com/2012/05/the-importance-of-putting-the-u-and-i-in-visualization/?utm_source=data&utm_medium=editorial&utm_campaign=auto3&utm_term=643284+teradata-gets-into-the-in-memory-biz-to-take-on-saps-hana&utm_content=dharrisstructure">The importance of putting the U and I in visualization</a></li><li><a href="http://pro.gigaom.com/2010/10/will-hadoop-vendors-profit-from-banks-big-data-woes/?utm_source=data&utm_medium=editorial&utm_campaign=auto3&utm_term=643284+teradata-gets-into-the-in-memory-biz-to-take-on-saps-hana&utm_content=dharrisstructure">Will Hadoop Vendors Profit from Banks&#8217; Big Data Woes?</a></li></ul>]]></content:encoded>
			<wfw:commentRss>http://gigaom.com/2013/05/08/teradata-gets-into-the-in-memory-biz-to-take-on-saps-hana/feed/</wfw:commentRss>
		<slash:comments>0</slash:comments>
	
		<media:thumbnail url="http://gigaom2.files.wordpress.com/2013/05/shutterstock_127075202.jpg?w=150" />
		<media:content url="http://gigaom2.files.wordpress.com/2013/05/shutterstock_127075202.jpg?w=150" medium="image">
			<media:title type="html">ram memory</media:title>
		</media:content>

		<media:content url="http://0.gravatar.com/avatar/9e48ffa0913f65c577727457dd63023f?s=96&#38;d=retro&#38;r=PG" medium="image">
			<media:title type="html">dharrisstructure</media:title>
		</media:content>

		<media:content url="http://gigaom2.files.wordpress.com/2013/05/tdc2.jpg" medium="image">
			<media:title type="html">tdc2</media:title>
		</media:content>
	</item>
		<item>
		<title>How MailChimp learned to treat data like orange juice and rethink email in the process</title>
		<link>http://gigaom.com/2013/05/05/how-mailchimp-learned-to-treat-data-like-orange-juice-and-rethink-email-in-the-process/</link>
		<comments>http://gigaom.com/2013/05/05/how-mailchimp-learned-to-treat-data-like-orange-juice-and-rethink-email-in-the-process/#comments</comments>
		<pubDate>Sun, 05 May 2013 23:09:53 +0000</pubDate>
		<dc:creator>Derrick Harris</dc:creator>
				<category><![CDATA[analytics]]></category>
		<category><![CDATA[artificial intelligence]]></category>
		<category><![CDATA[big data]]></category>
		<category><![CDATA[clustering]]></category>
		<category><![CDATA[email marketing]]></category>
		<category><![CDATA[machine-learning]]></category>
		<category><![CDATA[MailChimp]]></category>
		<category><![CDATA[natural language processing]]></category>
		<category><![CDATA[predictive models]]></category>
		<category><![CDATA[semantic analysis]]></category>

		<guid isPermaLink="false">http://gigaom.com/?p=642316</guid>
		<description><![CDATA[MailChimp wasn't always a big data company, but 12 years into its existence the company is using its mountains of email data to do everything from modeling spam to connecting subscribers.<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=gigaom.com&#038;blog=14960843&#038;post=642316&#038;subd=gigaom2&#038;ref=&#038;feed=1" width="1" height="1" />]]></description>
				<content:encoded><![CDATA[<p>MailChimp Chief Data Scientist John Foreman likes to talk about orange juice. On the surface, it&#8217;s a strange way to start a discussion about data, but it all starts to make sense when you peel back the rind. It&#8217;s a way of thinking that&#8217;s letting MailChimp &#8212; which sends about 35 billion emails a year on behalf of roughly 3 million users &#8212; transform itself into a data-driven business 12 years into its existence.</p>
<p>When you&#8217;re in Atlanta, as I was during a recent trip, the obvious place to start talking about orange juice and data is with Coca-Cola. Foreman can tell you all about how the beverage giant &#8212; whose headquarters tower over the city just a just a mile away from MailChimp&#8217;s office &#8212; <a href="http://www.businessweek.com/articles/2013-01-31/coke-engineers-its-orange-juice-with-an-algorithm">uses advanced algorithms and giant vats of different juices</a> to ensure the proper flavor of its Simply Orange line of orange juice. However, it&#8217;s something else Coca-Cola is doing that inspired the way Foreman thinks about data and that&#8217;s helping MailChimp re-imagine what it means to engage with fans, readers and customer through their inboxes.</p>
<p>Anyone familiar with how large web companies <a href="http://gigaom.com/2013/03/04/the-history-of-hadoop-from-4-nodes-to-the-future-of-data/">came to pioneer the practice of what we now call &#8220;big data&#8221;</a> should appreciate the analogy. Coca-Cola, which also owns Minute Maid, produces a lot of excess pulp when it makes orange juice. For decades, presumably, it had just been throwing that pulp away, but in 2006 it decided to make use of it by launching a new product called Minute Maid Pulpy. Sold primarily in Asian countries, Pulpy <a href="http://www.ajc.com/news/business/coca-colas-minute-maid-pulpy-reaches-1-billion-in-/nQqFM/">has become a billion-dollar business</a> for Coca-Cola.</p>
<p>Once MailChimp is done with its primary business of sending emails, it has a lot of pulp of its own in the form of data. And rather than just ignoring it or writing up some cute blog posts (<a href="http://blog.mailchimp.com/author/jforeman/">which he also does</a>), Foreman and his bosses want to turn that data into revenue.</p>
<h2 id="first-things-first-making-bett">First things first: Making better orange juice</h2>
<div id="attachment_642357" class="wp-caption alignleft" style="width: 310px"><a href="http://gigaom2.files.wordpress.com/2013/05/20130424_121443.jpg"><img  alt="Neil Bainton" src="http://gigaom2.files.wordpress.com/2013/05/20130424_121443-e1367793432461.jpg?w=300&#038;h=200" width="300" height="200" class="size-medium wp-image-642357" /></a><p class="wp-caption-text">Neil Bainton</p></div>
<p>Actually, though, MailChimp first brought in Foreman in 2011 to help the company improve its core business of letting users build and send their emails. MailChimp&#8217;s culture was built around many things, COO Neil Bainton told me, but data wasn&#8217;t one of them. It had &#8220;various fits and starts&#8221; through the years trying to work data into its business model, and each step just added more complexity.</p>
<p>The challenges were technological as well as cultural, but Foreman had a plan, of which focus was a key aspect. Keeping a tight focus meant Foreman and his lone-developer sidekick could build what they needed to in a short timeframe. It also meant the company didn&#8217;t have to worry about some massive overnight transformation into a data-obsessed company like Google.</p>
<div id="attachment_642358" class="wp-caption alignright" style="width: 310px"><a href="http://gigaom2.files.wordpress.com/2013/05/20130424_121423.jpg"><img  alt="John Foreman" src="http://gigaom2.files.wordpress.com/2013/05/20130424_121423-e1367793376856.jpg?w=300&#038;h=200" width="300" height="200" class="size-medium wp-image-642358" /></a><p class="wp-caption-text">John Foreman</p></div>
<p>&#8220;[They] don&#8217;t need to be afraid the entire culture is gonna fall down if we bring in this weird math guy,&#8221; he joked.</p>
<p>Foreman&#8217;s first project &#8212; deploying artificial intelligence models that would <a href="http://blog.mailchimp.com/project-omnivore-three-years-of-gorging-on-data/">automatically detect spammy email lists from MailChimp&#8217;s users</a> &#8211; is actually critical to the way MailChimp operates, though. It was up and running in production within a year, after a technologically challenging effort of merging separate database instances for each customer into a single environment that would let MailChimp run complex analyses across its customer base.</p>
<p>It&#8217;s such an important project, Foreman explained, because internet service and email providers keep reputation scores on the IP addresses that send email through their systems. Because MailChimp serves as the email engine for its millions of users, sending too many messages that get flagged as spam and lower MailChimp&#8217;s reputation will have a negative impact on everyone. The company used to deal with spam manually, and only after recipients began complaining about the messages they received.</p>
<p>&#8220;It used to be before we had that AI model in place that everyone had a crappier experience,&#8221; Foreman said.</p>
<h2 id="say-goodbye-to-those-90s-fans-">Say goodbye to those &#8217;90s fans, Pearl Jam</h2>
<div id="attachment_642362" class="wp-caption alignleft" style="width: 310px"><a href="http://gigaom2.files.wordpress.com/2013/05/bcdf-1024x864.png"><img  alt="Source: MailChimp" src="http://gigaom2.files.wordpress.com/2013/05/bcdf-1024x864.png?w=300&#038;h=253" width="300" height="253" class="size-medium wp-image-642362" /></a><p class="wp-caption-text">Source: MailChimp</p></div>
<p>Now, however, MailChimp knows some of the telltale signs of spam for which it should be on the lookout. If too high a percentage of email addresses on a given list are also <a href="http://blog.mailchimp.com/aol-and-hotmail-users-spend-more-than-gmail-users-and-other-research-finds/">available via publicly available lists</a> or those you can buy on sketchy corners of the internet, it&#8217;s probably spam. Too many old and far-more-likely-to-be-dead Earthlink or Compuserve addresses, or letters within one keystroke of each other as if someone just mashed the keyboard? Probably spam.</p>
<p>Thankfully, though, about 98 percent of the spam that MailChimp identifies is what Foreman calls &#8220;ignorant&#8221; &#8212; that is, people or companies that just don&#8217;t know the laws or best practices around sending emails. But ignorance doesn&#8217;t mean MailChimp relaxes its rules. Recently, it even flagged Pearl Jam for spammy practices because the band was trying to reconnect with old fans whose email addresses read like a who&#8217;s who list of 1990s email providers.</p>
<p>Having such a high percentage of ignorant spam actually has a positive effect on the company&#8217;s overall goal of monetizing its vast data repositories. Because the AI model automates what used to be a manual process, and because most innocent spammers will fall in line quickly once they&#8217;re notified (as opposed to nefarious spammers who constantly try to outsmart the system), MailChimp can pretty much set the model loose, forget about it and get to work on new efforts, Foreman said.</p>
<h2 id="now-about-that-pulp">Now, about that pulp</h2>
<p>Spam under control, MailChimp can focus its efforts on actually building new products with data, just like Coca-Cola did with that extra pulp. One of its first orders of business is figuring out how to help customers get to know better the people to whom they&#8217;re sending their newsletters.</p>
<p>With this in mind, the company built a service called <a href="http://wavelength.mailchimpapp.com/">Wavelength</a> that shows customers other newsletters that are similar to theirs. But the system that powers Wavelength also stores pretty much every interaction that every email address in the company&#8217;s database has with the newsletters they&#8217;re sent. That means what emails they open and when they open them, what links they click and when they click them, and what other newsletters they&#8217;re subscribed to. MailChimp also has a feature called <a href="http://kb.mailchimp.com/article/what-is-ecommerce360-and-how-does-it-work-with-mailchimp">Ecommerce360</a> that lets customers track clicks right through to conversions (marketing speak for someone actually buying something).</p>
<p>The company has been <a href="http://blog.mailchimp.com/digging-deeper-into-wavelength-and-egp-data-finding-interest-clusters-in-mailchimps-network/">playing around with this data to identify clusters of users</a> based on their behaviors and their interests &#8212; some of which Foreman has detailed on the company&#8217;s blog &#8212; and now it wants to roll it out to customers via a product MailChimp is calling ChimpQuery. Built atop <a href="http://gigaom.com/2013/03/14/google-bigquery-is-now-even-bigger/">Google&#8217;s BigQuery analytics service</a>, ChimpQuery will let customers start doing this type of clustering and segmentation on their own, while saving MailChimp the troubles of hosting that infrastructure itself. (You can play with a monstrous, interactive graph of the entire MailChimp subscriber list <a href="http://zoom.it/HD3t#full">here</a>.)</p>
<p>If you sell knitting supplies and you find out there&#8217;s a big cluster of people on your mailing list who also are interested in wedding planning and custom jewelry, there might be an opportunity to create your content with these interests in mind or even to partner with companies in those spaces.</p>
<div id="attachment_642360" class="wp-caption aligncenter" style="width: 718px"><a href="http://gigaom2.files.wordpress.com/2013/05/marriedknit-tiff.jpg"><img  alt="A sample cluster of subscribers." src="http://gigaom2.files.wordpress.com/2013/05/marriedknit-tiff.jpg?w=708&#038;h=427" width="708" height="427" class="size-large wp-image-642360" /></a><p class="wp-caption-text">A sample cluster of subscribers.</p></div>
<p>Another topic that has been on Foreman&#8217;s mind lately is what he calls &#8220;frequency elasticity of engagement.&#8221; <a href="http://blog.mailchimp.com/sending-frequency-more-is-not-always-better/">He&#8217;s done research</a> suggesting that blasting the heck out of your email list might actually have detrimental effects in the long term (regardless of <a href="http://gigaom.com/2012/12/08/how-obamas-data-scientists-built-a-volunteer-army-on-facebook/">how the Obama campaign successfully exploited this strategy</a>) but noted that engagement also has a lot to do with content and a particular company&#8217;s given user list. MailChimp&#8217;s data could help customers figure out the ideal schedule for emailing their subscribers.</p>
<p>For example, Birchbox has really high engagement because people love the service and have to open their emails to find out what goodies they&#8217;re receiving. Emails from a company like Papa John&#8217;s, on the other hand, might sit in someone&#8217;s inbox essentially as spam until they want to order a pizza and go searching for a coupon. Everyone has to figure out what pace and engagement metrics work for them.</p>
<h2 id="reining-expectations-back-in">Reining expectations back in</h2>
<p>However, now that management is fully sold on the power of data, Foreman sometimes finds himself managing expectations rather than just pitching his ideas. COO Bainton, for example, is adamant that MailChimp start aiding its publishing-industry customers by using techniques such as natural-language processing and semantic analysis to help them personalize emails based on readers stated and unstated interests (that is, what boxes they check when they sign up and what stuff they actually click on).</p>
<p>Foreman, well, he&#8217;s pretty sure that&#8217;s too big a challenge for MailChimp to tackle considering how many publishing customers it has. MailChimp would have to understand all those customers&#8217; industries to some degree (<a href="http://www.opencalais.com/about">open source tools</a> tend to highlight technically but not situationally relevant relationships, he said, and don&#8217;t always understand things like sarcasm) and probably the different languages they publish in, as well. Rather than understand content, he&#8217;d rather focus personalization efforts around how users are connected.</p>
<p>The company also needs to balance its ambitions with what&#8217;s legally and socially acceptable. The creep factor might be more important than what&#8217;s legal when it comes to email marketing. MailChimp determines the legality of everything it does before rolling it out, Foreman explained, but in era of &#8220;post-modern spam&#8221; where legitimacy is in the eye of the recipient and where some people use their &#8220;spam&#8221; button as a proxy for unsubscribing, companies must be careful not to offend.</p>
<p>&#8220;The more we can tell you about that list without getting creepy is really useful,&#8221; Bainton said. However, he added, &#8221;I think expectation is more important than law.&#8221;</p>
<br />  <img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=gigaom.com&#038;blog=14960843&#038;post=642316&#038;subd=gigaom2&#038;ref=&#038;feed=1" width="1" height="1" /><p><a href="http://pubads.g.doubleclick.net/gampad/jump?iu=/1008864/GigaOM_RSS_300x250&#038;sz=300x250&#038;c=571745"><img src="http://pubads.g.doubleclick.net/gampad/ad?iu=/1008864/GigaOM_RSS_300x250&#038;sz=300x250&#038;c=571745" /></a></p><p><strong>Related research and analysis from GigaOM Pro:</strong><br />Subscriber content. <a href="http://pro.gigaom.com/?utm_source=data&utm_medium=editorial&utm_campaign=auto3&utm_term=642316+how-mailchimp-learned-to-treat-data-like-orange-juice-and-rethink-email-in-the-process&utm_content=dharrisstructure">Sign up for a free trial</a>.</p><ul><li><a href="http://pro.gigaom.com/2012/01/why-the-next-front-in-big-data-might-be-psychological/?utm_source=data&utm_medium=editorial&utm_campaign=auto3&utm_term=642316+how-mailchimp-learned-to-treat-data-like-orange-juice-and-rethink-email-in-the-process&utm_content=dharrisstructure">Why the next front in big data might be psychological</a></li><li><a href="http://pro.gigaom.com/2010/10/will-hadoop-vendors-profit-from-banks-big-data-woes/?utm_source=data&utm_medium=editorial&utm_campaign=auto3&utm_term=642316+how-mailchimp-learned-to-treat-data-like-orange-juice-and-rethink-email-in-the-process&utm_content=dharrisstructure">Will Hadoop Vendors Profit from Banks&#8217; Big Data Woes?</a></li><li><a href="http://pro.gigaom.com/2010/09/the-red-hot-data-warehouse-market-whos-buying-next/?utm_source=data&utm_medium=editorial&utm_campaign=auto3&utm_term=642316+how-mailchimp-learned-to-treat-data-like-orange-juice-and-rethink-email-in-the-process&utm_content=dharrisstructure">The Red-Hot Data Warehouse Market: Who&#8217;s Buying Next?</a></li></ul>]]></content:encoded>
			<wfw:commentRss>http://gigaom.com/2013/05/05/how-mailchimp-learned-to-treat-data-like-orange-juice-and-rethink-email-in-the-process/feed/</wfw:commentRss>
		<slash:comments>4</slash:comments>
	
		<media:thumbnail url="http://gigaom2.files.wordpress.com/2013/05/joyusgray-e1367794217987.png?w=150" />
		<media:content url="http://gigaom2.files.wordpress.com/2013/05/joyusgray-e1367794217987.png?w=150" medium="image">
			<media:title type="html">JoyusGray</media:title>
		</media:content>

		<media:content url="http://0.gravatar.com/avatar/9e48ffa0913f65c577727457dd63023f?s=96&#38;d=retro&#38;r=PG" medium="image">
			<media:title type="html">dharrisstructure</media:title>
		</media:content>

		<media:content url="http://gigaom2.files.wordpress.com/2013/05/20130424_121443-e1367793432461.jpg?w=300" medium="image">
			<media:title type="html">Neil Bainton</media:title>
		</media:content>

		<media:content url="http://gigaom2.files.wordpress.com/2013/05/20130424_121423-e1367793376856.jpg?w=300" medium="image">
			<media:title type="html">John Foreman</media:title>
		</media:content>

		<media:content url="http://gigaom2.files.wordpress.com/2013/05/bcdf-1024x864.png?w=300" medium="image">
			<media:title type="html">Source: MailChimp</media:title>
		</media:content>

		<media:content url="http://gigaom2.files.wordpress.com/2013/05/marriedknit-tiff.jpg?w=708" medium="image">
			<media:title type="html">A sample cluster of subscribers.</media:title>
		</media:content>
	</item>
	</channel>
</rss>
