<?xml version="1.0" encoding="UTF-8"?>
<rss version="2.0"
	xmlns:content="http://purl.org/rss/1.0/modules/content/"
	xmlns:wfw="http://wellformedweb.org/CommentAPI/"
	xmlns:dc="http://purl.org/dc/elements/1.1/"
	xmlns:atom="http://www.w3.org/2005/Atom"
	xmlns:sy="http://purl.org/rss/1.0/modules/syndication/"
	xmlns:slash="http://purl.org/rss/1.0/modules/slash/"
	xmlns:georss="http://www.georss.org/georss" xmlns:geo="http://www.w3.org/2003/01/geo/wgs84_pos#" xmlns:media="http://search.yahoo.com/mrss/"
	>

<channel>
	<title>James Dixon's Blog</title>
	<atom:link href="http://jamesdixon.wordpress.com/feed/" rel="self" type="application/rss+xml" />
	<link>http://jamesdixon.wordpress.com</link>
	<description>James Dixon's thoughts on commercial open source and open source business intelligence</description>
	<lastBuildDate>Wed, 18 Jan 2012 21:18:58 +0000</lastBuildDate>
	<language>en</language>
	<sy:updatePeriod>hourly</sy:updatePeriod>
	<sy:updateFrequency>1</sy:updateFrequency>
	<generator>http://wordpress.com/</generator>
<cloud domain='jamesdixon.wordpress.com' port='80' path='/?rsscloud=notify' registerProcedure='' protocol='http-post' />
<image>
		<url>http://s2.wp.com/i/buttonw-com.png</url>
		<title>James Dixon's Blog</title>
		<link>http://jamesdixon.wordpress.com</link>
	</image>
	<atom:link rel="search" type="application/opensearchdescription+xml" href="http://jamesdixon.wordpress.com/osd.xml" title="James Dixon&#039;s Blog" />
	<atom:link rel='hub' href='http://jamesdixon.wordpress.com/?pushpress=hub'/>
		<item>
		<title>Exporting, Reporting, and Visualizing: Get more from your data in MongoDB</title>
		<link>http://jamesdixon.wordpress.com/2012/01/18/exporting-reporting-and-visualizing-get-more-from-your-data-in-mongodb/</link>
		<comments>http://jamesdixon.wordpress.com/2012/01/18/exporting-reporting-and-visualizing-get-more-from-your-data-in-mongodb/#comments</comments>
		<pubDate>Wed, 18 Jan 2012 19:57:20 +0000</pubDate>
		<dc:creator>James</dc:creator>
				<category><![CDATA[Uncategorized]]></category>
		<category><![CDATA[Pentaho MongoDB]]></category>

		<guid isPermaLink="false">http://jamesdixon.wordpress.com/?p=819</guid>
		<description><![CDATA[I&#8217;m presenting this session tomorrow at the MongoDB LA conference. We&#8217;ve got some great tech to demo. Tweet tag &#8211; #mongodbLA<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=jamesdixon.wordpress.com&amp;blog=3802959&amp;post=819&amp;subd=jamesdixon&amp;ref=&amp;feed=1" width="1" height="1" />]]></description>
			<content:encoded><![CDATA[<p>I&#8217;m presenting this session tomorrow at the MongoDB LA conference. We&#8217;ve got some great tech to demo.<br />
Tweet tag &#8211; #mongodbLA</p>
<br />  <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gocomments/jamesdixon.wordpress.com/819/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/comments/jamesdixon.wordpress.com/819/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godelicious/jamesdixon.wordpress.com/819/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/delicious/jamesdixon.wordpress.com/819/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gofacebook/jamesdixon.wordpress.com/819/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/facebook/jamesdixon.wordpress.com/819/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gotwitter/jamesdixon.wordpress.com/819/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/twitter/jamesdixon.wordpress.com/819/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gostumble/jamesdixon.wordpress.com/819/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/stumble/jamesdixon.wordpress.com/819/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godigg/jamesdixon.wordpress.com/819/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/digg/jamesdixon.wordpress.com/819/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/goreddit/jamesdixon.wordpress.com/819/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/reddit/jamesdixon.wordpress.com/819/" /></a> <img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=jamesdixon.wordpress.com&amp;blog=3802959&amp;post=819&amp;subd=jamesdixon&amp;ref=&amp;feed=1" width="1" height="1" />]]></content:encoded>
			<wfw:commentRss>http://jamesdixon.wordpress.com/2012/01/18/exporting-reporting-and-visualizing-get-more-from-your-data-in-mongodb/feed/</wfw:commentRss>
		<slash:comments>0</slash:comments>
	
		<media:content url="" medium="image">
			<media:title type="html">jimmyed2000</media:title>
		</media:content>
	</item>
		<item>
		<title>Pentaho BI 4.0 Thin Client APIs and Theming webinar tomorrow</title>
		<link>http://jamesdixon.wordpress.com/2011/08/30/pentaho-bi-4-0-thin-client-apis-and-theming-webinar-tomorrow/</link>
		<comments>http://jamesdixon.wordpress.com/2011/08/30/pentaho-bi-4-0-thin-client-apis-and-theming-webinar-tomorrow/#comments</comments>
		<pubDate>Tue, 30 Aug 2011 18:13:38 +0000</pubDate>
		<dc:creator>James</dc:creator>
				<category><![CDATA[Uncategorized]]></category>

		<guid isPermaLink="false">http://jamesdixon.wordpress.com/?p=817</guid>
		<description><![CDATA[Tomorrow I&#8217;m doing a session about the new data access APIs in the V4.0 release, as well as sharing some knowledge about the new theme system in the BI server. Here is the session info for those that are interested: Topic: Pentaho Community Technical WebEx &#8211; James Dixon &#8211; Pentaho BI 4.0 Thin Client APIs and [...]<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=jamesdixon.wordpress.com&amp;blog=3802959&amp;post=817&amp;subd=jamesdixon&amp;ref=&amp;feed=1" width="1" height="1" />]]></description>
			<content:encoded><![CDATA[<p>Tomorrow I&#8217;m doing a session about the new data access APIs in the V4.0 release, as well as sharing some knowledge about the new theme system in the BI server.</p>
<p>Here is the session info for those that are interested:</p>
<p>Topic: Pentaho Community Technical WebEx &#8211; James Dixon &#8211; Pentaho BI 4.0 Thin Client APIs and Theming<br />
Date and Time:</p>
<p style="padding-left:30px;">Wednesday, August 31, 2011 10:00 am, Eastern Daylight Time (New York, GMT-04:00)<br />
Wednesday, August 31, 2011 2:00 pm, Greenwich Time (Reykjavik, GMT)<br />
Wednesday, August 31, 2011 4:00 pm, Europe Summer Time (Paris, GMT+02:00)<br />
Thursday, September 1, 2011 12:00 am, Australia Eastern Standard Time (Sydney, GMT+10:00)</p>
<p>Event number: 712 776 191<br />
Event password: opensource</p>
<p>&#8212;&#8212;&#8212;&#8212;&#8212;&#8212;&#8212;&#8212;&#8212;&#8212;&#8212;&#8212;&#8212;&#8212;&#8212;&#8212;&#8212;&#8212;-<br />
To join the online event<br />
&#8212;&#8212;&#8212;&#8212;&#8212;&#8212;&#8212;&#8212;&#8212;&#8212;&#8212;&#8212;&#8212;&#8212;&#8212;&#8212;&#8212;&#8212;-<br />
1. <a href="https://pentaho.webex.com/pentaho/onstage/g.php?d=712776191&amp;t=a&amp;EA=dev.pentaho%40pentaho.org&amp;ET=4b3a4deb21d439ad703449b420e9bb36&amp;ETR=de22fea937a9b0976b3a1b466f7ab631&amp;RT=MiMxMQ==&amp;p">Click here to join the online event</a>.<br />
Or copy and paste the following link to a browser:</p>
<p>https://pentaho.webex.com/pentaho/onstage/g.php?d=712776191&#038;t=a&#038;EA=dev.pentaho%40pentaho.org&#038;ET=4b3a4deb21d439ad703449b420e9bb36&#038;ETR=de22fea937a9b0976b3a1b466f7ab631&#038;RT=MiMxMQ==&#038;p</p>
<p>2. Click &#8220;Join Now&#8221;.</p>
<p>&#8212;&#8212;&#8212;&#8212;&#8212;&#8212;&#8212;&#8212;&#8212;&#8212;&#8212;&#8212;&#8212;&#8212;&#8212;&#8212;&#8212;&#8212;-<br />
To join the teleconference only<br />
&#8212;&#8212;&#8212;&#8212;&#8212;&#8212;&#8212;&#8212;&#8212;&#8212;&#8212;&#8212;&#8212;&#8212;&#8212;&#8212;&#8212;&#8212;-<br />
Call-in toll-free number (US/Canada): 1-866-699-3239<br />
Call-in toll number (US/Canada): 1-408-792-6300<br />
Global call-in numbers: https://pentaho.webex.com/pentaho/globalcallin.php?serviceType=EC&amp;ED=161656302&amp;tollFree=1<br />
Toll-free dialing restrictions: http://www.webex.com/pdf/tollfree_restrictions.pdf<br />
Access code: 712 776 191</p>
<br />  <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gocomments/jamesdixon.wordpress.com/817/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/comments/jamesdixon.wordpress.com/817/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godelicious/jamesdixon.wordpress.com/817/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/delicious/jamesdixon.wordpress.com/817/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gofacebook/jamesdixon.wordpress.com/817/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/facebook/jamesdixon.wordpress.com/817/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gotwitter/jamesdixon.wordpress.com/817/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/twitter/jamesdixon.wordpress.com/817/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gostumble/jamesdixon.wordpress.com/817/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/stumble/jamesdixon.wordpress.com/817/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godigg/jamesdixon.wordpress.com/817/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/digg/jamesdixon.wordpress.com/817/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/goreddit/jamesdixon.wordpress.com/817/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/reddit/jamesdixon.wordpress.com/817/" /></a> <img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=jamesdixon.wordpress.com&amp;blog=3802959&amp;post=817&amp;subd=jamesdixon&amp;ref=&amp;feed=1" width="1" height="1" />]]></content:encoded>
			<wfw:commentRss>http://jamesdixon.wordpress.com/2011/08/30/pentaho-bi-4-0-thin-client-apis-and-theming-webinar-tomorrow/feed/</wfw:commentRss>
		<slash:comments>0</slash:comments>
	
		<media:content url="" medium="image">
			<media:title type="html">jimmyed2000</media:title>
		</media:content>
	</item>
		<item>
		<title>Using open source software is not a sin. We encourage it.</title>
		<link>http://jamesdixon.wordpress.com/2011/06/29/using-open-source-software-is-not-a-sin-we-encourage-it/</link>
		<comments>http://jamesdixon.wordpress.com/2011/06/29/using-open-source-software-is-not-a-sin-we-encourage-it/#comments</comments>
		<pubDate>Wed, 29 Jun 2011 21:22:40 +0000</pubDate>
		<dc:creator>James</dc:creator>
				<category><![CDATA[Uncategorized]]></category>

		<guid isPermaLink="false">http://jamesdixon.wordpress.com/?p=812</guid>
		<description><![CDATA[Brian Gentile of Jaspersoft usually has some interesting and worthwhile things to say on his blog. But, in his latest post, he seems to have gone stark raving mad (to put it politely). The sin in open source comes from contributing neither one’s time nor money He makes the bold statement that using open source [...]<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=jamesdixon.wordpress.com&amp;blog=3802959&amp;post=812&amp;subd=jamesdixon&amp;ref=&amp;feed=1" width="1" height="1" />]]></description>
			<content:encoded><![CDATA[<p>Brian Gentile of Jaspersoft usually has some interesting and worthwhile things to say on his blog. But, in <a href="http://openbookonbi.blogspot.com/2011/06/sin-in-open-source.html">his latest post</a>, he seems to have gone stark raving mad (to put it politely).</p>
<blockquote><p>The sin in open source comes from contributing neither one’s time nor money</p></blockquote>
<p>He makes the bold statement that using open source software without contributing to that project is a sin. I’m not misquoting him, he says it’s a sin.</p>
<p>He goes on to say that if you use JasperSoft community edition you are required to contribute.</p>
<blockquote><p>Your contribution is required.</p></blockquote>
<p>This is called quid-pro-quo – they do something for you and you must do something for them. In some parts of the planet, certain forms of quid-pro-quo are classified as harassment and are illegal. This attitude towards community also rates very low on the openness scale &#8211; Gentile is only open to community members who are going to contribute  directly, and within a time-frame that Jaspersoft finds agreeable. I’m not sure the OSI will approve that license.</p>
<p>Obviously I disagree with his statements. Completely. Utterly. On multiple fronts.</p>
<h2><span style="font-size:large;"><strong>Self-Interest</strong></span></h2>
<p>Firstly, open source works best when all participants act purely out of self-interest, and by doing so, the other participants benefit as a side effect. Here are some examples:</p>
<ul>
<li><strong>Reduce Future Work</strong>: I have contributed bug fixes to Apache foundation and JBoss projects. I did this not because I feel an obligation to do so, but because I want them to maintain the patch in future versions so I don’t have to continually merge my change with each new version. I contribute my bug fixes purely out of self-interest – I want to reduce my future workload. I also didn’t go looking for those bugs. I came across those bugs while trying to use their open source software to solve a real problem or requirement I faced. By contributing my fixes out of self-interest, all the other participants gain higher quality software.</li>
</ul>
<ul>
<li><strong>Education and Career</strong>: In prior decades it was not easy to show potential employers your prior work – because often all of it was the proprietary intellectual property of your previous employers. Today, if you are a software engineer, technical writer, graphic artist etc, you can contribute to open source projects as a way of demonstrating your work. This is particularly true of certain open source projects – if you have contributed code to the Linux kernel your lifetime earning potential is probably higher as a result. If you are a software engineer and you want to work at RedHat, your application for a position will be considered significantly more if you are active in their community.</li>
</ul>
<ul>
<li><strong>Getting It Done</strong>: Community members don’t post questions on forums for fun. They do it because they have a problem of some kind, and it is stopping them from getting something done. Maybe their question gets answered, maybe it doesn’t. Either way the question is a contribution – often a question identifies a problem with the installer, or the documentation, or a feature, or the download site, or the expectations set by the web site etc. The asker of the question did not ask it in order to gently identify an opportunity for improvement, they did it out of self-interest, but it still counts as a contribution.</li>
</ul>
<ul>
<li><strong>Status and Satisfaction</strong>: It is satisfying to contribute in a community. There is also status and reputation to be gained. While this form of reward is not monetary, career-driven, or externally noticeable, it is a benefit that is derived by the participant. If the community member did not feel this satisfaction, they would not waste their time contributing. If there is a particular application area you are interested in (music, graphics, gaming, mobile devices etc), but there are no career opportunities open to you, you can participate in an open source project to satisfy your interest/curiosity.</li>
</ul>
<ul>
<li><strong>Business</strong>: Some companies sponsor projects by encouraging (sometimes requiring) their employees to contribute to open source projects. In some cases these companies do this because they are services companies that want to demonstrate expertise with certain technologies to help attract new customers. The company gains attention and reputation, and in doing so the open source project and community benefit from the time and resources (selfishly) donated. Other companies sponsor their employees to contribute because the company relies on the software operationally. To reduce their risk of failures and downtime, the company needs to have engineers on staff who have deep technical knowledge of the software.</li>
</ul>
<ul>
<li><strong>Changing Market Dynamics</strong>: The act of choosing to use open source software instead of a proprietary alternative changes the market dynamics in favor of commercial open source companies. Just using the software is a contribution. Sometimes those users tell other people about the software they are using, and encourage them to use it. The community grows, and the market changes more. Over time this dynamic and the continual community growth help all the participants.</li>
</ul>
<p>As you can see there are many varied reasons people contribute to open source. In all these cases the participants are acting out of self-interest, but the community as a whole benefits from these selfish actions. But guilt and obligation are not on this list &#8211; they are very weak motivations.</p>
<p>With a commercial open source software (COSS) project you have a company that is the single most important participating organization. The motivations of this company are very important. It does not matter which company you look at, whether it’s RedHat, MySQL (Oracle), Pentaho, or Jaspersoft, that company exists for self-interest – to make money. There is nothing wrong with this, it’s actually very healthy. If the stewarding company is acting out of self-interest, you should not expect the community to act differently.</p>
<h2><span style="font-size:large;"><strong>Monetizing the Community</strong></span></h2>
<p>Secondly, Gentile is making an elementary mistake, one that is common among those that are new to the COSS business model. Gentile states “Open source communities thrive based on the community members donating either their time and/or money”. Within the COSS world getting community members to buy software and services is called ‘Monetizing the Community’. It is a clumsy term that encourages misguided actions. I refer to my <a title="6. Commercial Open Source Model" href="http://jamesdixon.wordpress.com/the-bees-and-the-trees/commercial-open-source-model/">Beekeeper model</a>. In there I state:</p>
<blockquote><p>Customers are corporations, the community are people. They have very different needs.</p></blockquote>
<p>The Beekeeper model makes it clear that it is pointless for a COSS company to try to sell its enterprise software and services to community members. This statement is true for all COSS companies that focus on business software (it is not true for open source consumer software such as games). This distinction is important, and it is missing from Gentile’s desperate plea. I’m guessing that only a very small percentage of the Jaspersoft installations are for personal use. Reporting software just isn’t that much fun. The majority of Jaspersoft’s installations are for business purposes. The individual who installed the software is usually a technical end user or an IT developer. Either way, the individual is not going to buy the software for their own needs &#8211; if a purchase of software is made, the customer will be the employer, not the community member. As a COSS company you can provide tools for your community members to persuade their employers to become customers, and you can explain how this benefits both companies involved and the community. For most COSS companies it is impossible to monetize the community directly, and therefore ridiculous to try. Trying to berate community members into purchasing business software shows a remarkable lack of understanding of the commercial open source business model. Asking, begging, or requiring community members to purchase your software is futile, Gentile.</p>
<p>I’m not pretending that the COSS business model is easy. I’m not pretending that Pentaho does not have room for improvement either. I am stating that Pentaho provides more BI functionality in open source than Jaspersoft, and that you are welcome to use that software &#8211; sin-free and guilt-free.</p>
<br />  <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gocomments/jamesdixon.wordpress.com/812/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/comments/jamesdixon.wordpress.com/812/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godelicious/jamesdixon.wordpress.com/812/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/delicious/jamesdixon.wordpress.com/812/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gofacebook/jamesdixon.wordpress.com/812/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/facebook/jamesdixon.wordpress.com/812/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gotwitter/jamesdixon.wordpress.com/812/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/twitter/jamesdixon.wordpress.com/812/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gostumble/jamesdixon.wordpress.com/812/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/stumble/jamesdixon.wordpress.com/812/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godigg/jamesdixon.wordpress.com/812/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/digg/jamesdixon.wordpress.com/812/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/goreddit/jamesdixon.wordpress.com/812/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/reddit/jamesdixon.wordpress.com/812/" /></a> <img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=jamesdixon.wordpress.com&amp;blog=3802959&amp;post=812&amp;subd=jamesdixon&amp;ref=&amp;feed=1" width="1" height="1" />]]></content:encoded>
			<wfw:commentRss>http://jamesdixon.wordpress.com/2011/06/29/using-open-source-software-is-not-a-sin-we-encourage-it/feed/</wfw:commentRss>
		<slash:comments>6</slash:comments>
	
		<media:content url="" medium="image">
			<media:title type="html">jimmyed2000</media:title>
		</media:content>
	</item>
		<item>
		<title>olap4j V1.0 has been released.</title>
		<link>http://jamesdixon.wordpress.com/2011/04/12/olap4j-v1-0-has-been-released/</link>
		<comments>http://jamesdixon.wordpress.com/2011/04/12/olap4j-v1-0-has-been-released/#comments</comments>
		<pubDate>Tue, 12 Apr 2011 12:24:23 +0000</pubDate>
		<dc:creator>James</dc:creator>
				<category><![CDATA[Business Intelligence]]></category>
		<category><![CDATA[commercial open source]]></category>
		<category><![CDATA[open source]]></category>

		<guid isPermaLink="false">http://jamesdixon.wordpress.com/?p=808</guid>
		<description><![CDATA[Back in the &#8217;90s and early 2000&#8217;s I was involved in the attempts by the proprietary BI vendors to create common standards. Anyone remember JOLAP? The vendors were doing this only because of increasing demand and frustration from their customers &#8211; none of them actually wanted these standards. Why? Because, in the short term, standards would [...]<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=jamesdixon.wordpress.com&amp;blog=3802959&amp;post=808&amp;subd=jamesdixon&amp;ref=&amp;feed=1" width="1" height="1" />]]></description>
			<content:encoded><![CDATA[<p>Back in the &#8217;90s and early 2000&#8217;s I was involved in the attempts by the proprietary BI vendors to create common standards. Anyone remember JOLAP? The vendors were doing this only because of increasing demand and frustration from their customers &#8211; none of them actually wanted these standards. Why? Because, in the short term, standards would only help the customers and the implementers, not the vendors. These efforts were hugely political with many of the vendors taking the opportunity to score points against each other. The resulting &#8216;standards&#8217; were useless, and none of the large vendors were willing, or able, to support them.</p>
<p>How refreshing, then, to have olap4j reach the 1.0 milestone &#8211; <a href="http://www.olap4j.org/">http://www.olap4j.org</a>. Created by consumers and producers of open source BI software, olap4j shows the advantage of open collaboration by motivated parties. Already olap4j has a Mondrian driver, and an XMLA driver for Microsoft SQL Server  Analysis Services, SAP BW, and Jedox Palo. There are also several clients who use olap4j servers, some from Pentaho, and Saiku, Wabit, and ADANS.</p>
<p>olap4j is very cool stuff. You can read more on <a href="http://julianhyde.blogspot.com/2011/04/olap4j-version-10-released.html">Julian Hyde&#8217;s blog</a>. Congratulations to everyone that has worked on olap4j.</p>
<br />  <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gocomments/jamesdixon.wordpress.com/808/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/comments/jamesdixon.wordpress.com/808/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godelicious/jamesdixon.wordpress.com/808/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/delicious/jamesdixon.wordpress.com/808/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gofacebook/jamesdixon.wordpress.com/808/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/facebook/jamesdixon.wordpress.com/808/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gotwitter/jamesdixon.wordpress.com/808/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/twitter/jamesdixon.wordpress.com/808/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gostumble/jamesdixon.wordpress.com/808/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/stumble/jamesdixon.wordpress.com/808/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godigg/jamesdixon.wordpress.com/808/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/digg/jamesdixon.wordpress.com/808/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/goreddit/jamesdixon.wordpress.com/808/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/reddit/jamesdixon.wordpress.com/808/" /></a> <img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=jamesdixon.wordpress.com&amp;blog=3802959&amp;post=808&amp;subd=jamesdixon&amp;ref=&amp;feed=1" width="1" height="1" />]]></content:encoded>
			<wfw:commentRss>http://jamesdixon.wordpress.com/2011/04/12/olap4j-v1-0-has-been-released/feed/</wfw:commentRss>
		<slash:comments>0</slash:comments>
	
		<media:content url="" medium="image">
			<media:title type="html">jimmyed2000</media:title>
		</media:content>
	</item>
		<item>
		<title>More Hadoop in New York City</title>
		<link>http://jamesdixon.wordpress.com/2011/01/27/more-hadoop-in-new-york-city/</link>
		<comments>http://jamesdixon.wordpress.com/2011/01/27/more-hadoop-in-new-york-city/#comments</comments>
		<pubDate>Thu, 27 Jan 2011 16:01:39 +0000</pubDate>
		<dc:creator>James</dc:creator>
				<category><![CDATA[Agile BI]]></category>
		<category><![CDATA[Business Intelligence]]></category>
		<category><![CDATA[commercial open source]]></category>
		<category><![CDATA[Hadoop]]></category>
		<category><![CDATA[Hive]]></category>

		<guid isPermaLink="false">http://jamesdixon.wordpress.com/?p=805</guid>
		<description><![CDATA[Yesterday was fun. First I met with a potential customer looking to try Hadoop for a big data project. Then I had a lengthy and interesting chat with Dan Woods. Amongst other things Dan runs http://www.citoresearch.com/ and also blogs for Forbes. We talked about Pentaho&#8217;s history and our experiences so far with the commercial open [...]<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=jamesdixon.wordpress.com&amp;blog=3802959&amp;post=805&amp;subd=jamesdixon&amp;ref=&amp;feed=1" width="1" height="1" />]]></description>
			<content:encoded><![CDATA[<p>Yesterday was fun. First I met with a potential customer looking to try Hadoop for a big data project.</p>
<p>Then I had a lengthy and interesting chat with Dan Woods. Amongst other things Dan runs <a href="http://www.citoresearch.com/">http://www.citoresearch.com/</a> and also blogs for <a href="http://blogs.forbes.com/ciocentral/2010/12/15/how-cios-should-be-helping-marketers/">Forbes</a>. We talked about Pentaho&#8217;s history and our experiences so far with the commercial open source model.   We also talked about Hadoop and big data and about the vision and roadmap of our Agile BI offering.</p>
<p>Next I met with Steve Lohr who is a <a href="http://topics.nytimes.com/top/reference/timestopics/people/l/steve_lohr/index.html">technology reporter for the New York Times</a>. We talked about many topics including the enterprise software markets and how open source is affecting them. We also talked about Hadoop, of course.</p>
<p>Next was a co-meet-up of the New York Predictive Analytics and No-SQL groups where I presented decks about Weka and Hadoop, separately and together. There were lots of interesting questions and side discussions earlier. By the time we finished all these topics a blizzard was going on outside. Cabs were nowhere to be seen so Matt Gershoff of Conductrics was kind enough to lead me via the subway to the vicinity of my hotel.</p>
<br />  <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gocomments/jamesdixon.wordpress.com/805/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/comments/jamesdixon.wordpress.com/805/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godelicious/jamesdixon.wordpress.com/805/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/delicious/jamesdixon.wordpress.com/805/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gofacebook/jamesdixon.wordpress.com/805/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/facebook/jamesdixon.wordpress.com/805/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gotwitter/jamesdixon.wordpress.com/805/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/twitter/jamesdixon.wordpress.com/805/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gostumble/jamesdixon.wordpress.com/805/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/stumble/jamesdixon.wordpress.com/805/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godigg/jamesdixon.wordpress.com/805/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/digg/jamesdixon.wordpress.com/805/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/goreddit/jamesdixon.wordpress.com/805/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/reddit/jamesdixon.wordpress.com/805/" /></a> <img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=jamesdixon.wordpress.com&amp;blog=3802959&amp;post=805&amp;subd=jamesdixon&amp;ref=&amp;feed=1" width="1" height="1" />]]></content:encoded>
			<wfw:commentRss>http://jamesdixon.wordpress.com/2011/01/27/more-hadoop-in-new-york-city/feed/</wfw:commentRss>
		<slash:comments>0</slash:comments>
	
		<media:content url="" medium="image">
			<media:title type="html">jimmyed2000</media:title>
		</media:content>
	</item>
		<item>
		<title>Big Data in New York City</title>
		<link>http://jamesdixon.wordpress.com/2011/01/26/big-data-in-new-york-city/</link>
		<comments>http://jamesdixon.wordpress.com/2011/01/26/big-data-in-new-york-city/#comments</comments>
		<pubDate>Wed, 26 Jan 2011 17:20:59 +0000</pubDate>
		<dc:creator>James</dc:creator>
				<category><![CDATA[Agile BI]]></category>
		<category><![CDATA[Business Intelligence]]></category>
		<category><![CDATA[commercial open source]]></category>
		<category><![CDATA[Hadoop]]></category>
		<category><![CDATA[open source]]></category>

		<guid isPermaLink="false">http://jamesdixon.wordpress.com/?p=802</guid>
		<description><![CDATA[I&#8217;m having an interesting time in NYC this week. I had to retrieve my snowboarding jacket out of the attic for this trip. It&#8217;s snowing right now, which is better than the sleet forecast for later. So far I&#8217;ve met with a few Big Data customers and prospects and presented at the New York Hadoop [...]<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=jamesdixon.wordpress.com&amp;blog=3802959&amp;post=802&amp;subd=jamesdixon&amp;ref=&amp;feed=1" width="1" height="1" />]]></description>
			<content:encoded><![CDATA[<p>I&#8217;m having an interesting time in NYC this week. I had to retrieve my snowboarding jacket out of the attic for this trip. It&#8217;s snowing right now, which is better than the sleet forecast for later. So far I&#8217;ve met with a few Big Data customers and prospects and presented at the New York Hadoop User Group. Our hybrid database/Hadoop data lake architecture always gets a good reception and our ability to run our data integration engine within the Hadoop data nodes impresses people.</p>
<p>Being the first Business Intelligence vendor to bring reporting and ETL to the Hadoop space sets us apart from all the other vendors. We have so much recognition in this space that I&#8217;ve spoken to a few people in the last month who thought we were &#8216;THE&#8217; visualization and data transformation provider for Hadoop and didn&#8217;t connect to other data sources.</p>
<p>This afternoon I&#8217;m meeting with reporters and columnists from a couple of different publications to chat about Big Data / Hadoop stuff. Tonight I&#8217;m presenting at the New York Predictive Analytics Meetup to talk about Hadoop from an analysis perspective.</p>
<p>&nbsp;</p>
<p>&nbsp;</p>
<br />  <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gocomments/jamesdixon.wordpress.com/802/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/comments/jamesdixon.wordpress.com/802/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godelicious/jamesdixon.wordpress.com/802/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/delicious/jamesdixon.wordpress.com/802/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gofacebook/jamesdixon.wordpress.com/802/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/facebook/jamesdixon.wordpress.com/802/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gotwitter/jamesdixon.wordpress.com/802/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/twitter/jamesdixon.wordpress.com/802/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gostumble/jamesdixon.wordpress.com/802/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/stumble/jamesdixon.wordpress.com/802/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godigg/jamesdixon.wordpress.com/802/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/digg/jamesdixon.wordpress.com/802/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/goreddit/jamesdixon.wordpress.com/802/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/reddit/jamesdixon.wordpress.com/802/" /></a> <img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=jamesdixon.wordpress.com&amp;blog=3802959&amp;post=802&amp;subd=jamesdixon&amp;ref=&amp;feed=1" width="1" height="1" />]]></content:encoded>
			<wfw:commentRss>http://jamesdixon.wordpress.com/2011/01/26/big-data-in-new-york-city/feed/</wfw:commentRss>
		<slash:comments>0</slash:comments>
	
		<media:content url="" medium="image">
			<media:title type="html">jimmyed2000</media:title>
		</media:content>
	</item>
		<item>
		<title>Meetups and Pentaho Summit(s) coming up in January</title>
		<link>http://jamesdixon.wordpress.com/2011/01/05/meetups-and-pentaho-summits-coming-up-in-january/</link>
		<comments>http://jamesdixon.wordpress.com/2011/01/05/meetups-and-pentaho-summits-coming-up-in-january/#comments</comments>
		<pubDate>Wed, 05 Jan 2011 21:20:34 +0000</pubDate>
		<dc:creator>James</dc:creator>
				<category><![CDATA[Agile BI]]></category>
		<category><![CDATA[Business Intelligence]]></category>
		<category><![CDATA[commercial open source]]></category>
		<category><![CDATA[Hadoop]]></category>
		<category><![CDATA[Hive]]></category>
		<category><![CDATA[open source]]></category>

		<guid isPermaLink="false">http://jamesdixon.wordpress.com/?p=796</guid>
		<description><![CDATA[It&#8217;s going to be a busy month. January 19th and 20th is our Global 2011 Summit in San Francisco. I have three sessions: Pentaho for Hadoop, Extending Pentaho&#8217;s Capabilities, and an Architecture Overview. So I&#8217;m creating and digging up some new sample plug-ins and extensions. I&#8217;m also going to take part in a Q&#38;A session [...]<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=jamesdixon.wordpress.com&amp;blog=3802959&amp;post=796&amp;subd=jamesdixon&amp;ref=&amp;feed=1" width="1" height="1" />]]></description>
			<content:encoded><![CDATA[<p>It&#8217;s going to be a busy month.</p>
<p>January 19th and 20th is our <a href="http://www.pentaho.com/events/20110119_global_partner_summit/?fotm=y" target="_blank">Global 2011 Summit</a> in San Francisco. I have three sessions: Pentaho for Hadoop, Extending Pentaho&#8217;s Capabilities, and an Architecture Overview. So I&#8217;m creating and digging up some new sample plug-ins and extensions. I&#8217;m also going to take part in a Q&amp;A session with the Pentaho architects since Julian Hyde (Mondrian), Matt Casters (PDI/Kettle), and Thomas Morgner (Pentaho Reporting) will all be there. Who should attend?</p>
<blockquote><p>CTOs, architects, product managers, business executives and partner-facing staff from System Integrators and Resellers, as well as Software Providers with a need to embed business intelligence or data integration software into your products.</p></blockquote>
<p>We usually have customers and prospects attending our summits as well.</p>
<p>We are also having an architect&#8217;s summit that same week to work on our 2011 technology road-map. That should be a lot of fun.</p>
<p>The week after that I&#8217;ll be in New York presenting at the NYC Hadoop User Group on Tuesday, January 25 and the NYC Predictive Analytics Meetup on Wednesday January 26th.</p>
<br />  <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gocomments/jamesdixon.wordpress.com/796/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/comments/jamesdixon.wordpress.com/796/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godelicious/jamesdixon.wordpress.com/796/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/delicious/jamesdixon.wordpress.com/796/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gofacebook/jamesdixon.wordpress.com/796/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/facebook/jamesdixon.wordpress.com/796/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gotwitter/jamesdixon.wordpress.com/796/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/twitter/jamesdixon.wordpress.com/796/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gostumble/jamesdixon.wordpress.com/796/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/stumble/jamesdixon.wordpress.com/796/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godigg/jamesdixon.wordpress.com/796/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/digg/jamesdixon.wordpress.com/796/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/goreddit/jamesdixon.wordpress.com/796/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/reddit/jamesdixon.wordpress.com/796/" /></a> <img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=jamesdixon.wordpress.com&amp;blog=3802959&amp;post=796&amp;subd=jamesdixon&amp;ref=&amp;feed=1" width="1" height="1" />]]></content:encoded>
			<wfw:commentRss>http://jamesdixon.wordpress.com/2011/01/05/meetups-and-pentaho-summits-coming-up-in-january/feed/</wfw:commentRss>
		<slash:comments>1</slash:comments>
	
		<media:content url="" medium="image">
			<media:title type="html">jimmyed2000</media:title>
		</media:content>
	</item>
		<item>
		<title>150,000 installations year-to-date for Pentaho</title>
		<link>http://jamesdixon.wordpress.com/2010/11/15/150000-installations-year-to-date-for-pentaho/</link>
		<comments>http://jamesdixon.wordpress.com/2010/11/15/150000-installations-year-to-date-for-pentaho/#comments</comments>
		<pubDate>Mon, 15 Nov 2010 15:27:37 +0000</pubDate>
		<dc:creator>James</dc:creator>
				<category><![CDATA[Business Intelligence]]></category>
		<category><![CDATA[commercial open source]]></category>
		<category><![CDATA[open source]]></category>

		<guid isPermaLink="false">http://jamesdixon.wordpress.com/?p=770</guid>
		<description><![CDATA[Our most recent figures show 156,000 copies of Pentaho software were installed so far this year. These numbers are not download numbers, but installed software that has been used. This includes Pentaho servers and some Pentaho client tools. These numbers do not represent only long-term installations, but also do not represent all Pentaho&#8217;s software distributions [...]<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=jamesdixon.wordpress.com&amp;blog=3802959&amp;post=770&amp;subd=jamesdixon&amp;ref=&amp;feed=1" width="1" height="1" />]]></description>
			<content:encoded><![CDATA[<p>Our most recent figures show 156,000 copies of Pentaho software were installed so far this year. These numbers are not download numbers, but installed software that has been used. This includes Pentaho servers and some Pentaho client tools. These numbers do not represent only long-term installations, but also do not represent all Pentaho&#8217;s software distributions or installations. Since these numbers are not absolutel</p>
<p>An analysis by country of these numbers shows interesting results.</p>
<h2>The Long Tail</h2>
<p>This chart shows the number of new installations year-to-date for each country. Our data shows new Pentaho installations in 176 countries so far this year. That&#8217;s out of a total of 229 countries.</p>
<p><a href="http://jamesdixon.files.wordpress.com/2010/11/new-pentaho-installs-long-tail.png"><img class="aligncenter size-full wp-image-779" title="New Pentaho Installs Long Tail" src="http://jamesdixon.files.wordpress.com/2010/11/new-pentaho-installs-long-tail.png?w=700" alt=""   /></a>This is clearly a classic long tail. In fact after the first 20 or 30 countries it is difficult to read values from the chart. This second chart uses a log scale. The line on this chart is almost perfectly linear, showing that the distribution by country is pretty much logarithmic.</p>
<p><a href="http://jamesdixon.files.wordpress.com/2010/11/new-pentaho-installs-long-tail-log.png"><img class="aligncenter size-full wp-image-778" title="New Pentaho Installs Long Tail Log" src="http://jamesdixon.files.wordpress.com/2010/11/new-pentaho-installs-long-tail-log.png?w=700" alt=""   /></a>Over the same time period Pentaho has customers in 46 countries. This is a larger geographic spread than most of the proprietary BI companies.</p>
<p>Since we are dealing with country-based data, here is the analysis I did using Google Geo Map, Pentaho Data Integration, and Pentaho BI Server.</p>
<h2>New Pentaho Installs Jan-Oct 2010</h2>
<p>This shows the geographic spread of the installations.</p>
<p><a href="http://jamesdixon.files.wordpress.com/2010/11/new-pentaho-installs.png"><img class="aligncenter size-full wp-image-774" title="New Pentaho Installs" src="http://jamesdixon.files.wordpress.com/2010/11/new-pentaho-installs.png?w=700&#038;h=449" alt="" width="700" height="449" /></a></p>
<p>It is fairly obvious from the map above that the highest number of installations were in the USA, China, and Brazil, followed by India and parts of Europe. But this simplistic graphic does not take into account the economics or demographics of the countries. How does the number of installations relate to the size or economic power of each country?</p>
<h2>New Installations Per $Billion GDP</h2>
<p>If we look at the number of new installations of Pentaho software per billion dollars of GDP we see a different picture. The GDP data is from the <a href="https://www.cia.gov/library/publications/the-world-factbook/index.html" target="_blank">CIA World Factbook</a></p>
<p><a href="http://jamesdixon.files.wordpress.com/2010/11/new-pentaho-installs-per-gdp.png"><img class="aligncenter size-full wp-image-772" title="New Pentaho Installs per billion $ GDP" src="http://jamesdixon.files.wordpress.com/2010/11/new-pentaho-installs-per-gdp.png?w=700&#038;h=449" alt="" width="700" height="449" /></a></p>
<p>I capped &#8216;Installs Per Bn GDP&#8217; at 10 to prevent outliers from skewing the color gradient.</p>
<p>Compared with the first map the prominence of the USA and China is reduced, and the areas of high activity are shown to be South America followed by Europe and parts of Asia. But analysis using GDP alone does not take into account things like exchange rates and the cost-of-living within a country &#8211; as a result there is probably a bias towards countries like the South American ones. So I went to find metrics that should remove the bias of economic factors.</p>
<h2>New Installations Per 100k Labor Force</h2>
<p>If we look at the number of new Pentaho installs compared with the labor force of each country we  get a slightly different picture. The labor force data is from the <a href="https://www.cia.gov/library/publications/the-world-factbook/index.html" target="_blank">CIA World Factbook</a></p>
<p><a href="http://jamesdixon.files.wordpress.com/2010/11/new-pentaho-installs-per-labor.png"><img class="aligncenter size-full wp-image-773" title="New Pentaho Installs per 100k Labor Force" src="http://jamesdixon.files.wordpress.com/2010/11/new-pentaho-installs-per-labor.png?w=700&#038;h=449" alt="" width="700" height="449" /></a></p>
<p>I capped &#8216;Installs Per 100k Labor Force&#8217; at 50 to prevent outliers from skewing the color gradient.</p>
<p>Compared with the first two maps, this one shows the South American, European, and North American countries roughly equal to each other. Australia and New Zealand are also comparable. Asia, Africa, and the Middle East are shown to be generally behind. What is odd about this graphic is that countries like India, generally considered to be significant open source consumers, are not shown to be within the leading countries. This is, I&#8217;m assuming, because a large percentage of the labor force is agricultural and, as such, less likely to be doing much BI.</p>
<h2>New Installations Per 100k Internet Users</h2>
<p>So instead of labor force, let&#8217;s look at new installations of Pentaho for every 100k internet users within a country.</p>
<p><a href="http://jamesdixon.files.wordpress.com/2010/11/new-pentaho-installs-per-internet-users.png"><img class="aligncenter size-full wp-image-781" title="New Pentaho Installs per Internet Users" src="http://jamesdixon.files.wordpress.com/2010/11/new-pentaho-installs-per-internet-users.png?w=700&#038;h=417" alt="" width="700" height="417" /></a></p>
<p>I capped &#8216;Installs Per 100k Internet Users&#8217; at 50 to prevent outliers from skewing the color gradient.</p>
<p>Here we see that South America is still prominent, along with southern Europe. The rest of Europe and North America come second along with India, other parts of Asia and Australia. South Africa also makes a showing for the first time. China however does not show strongly.</p>
<p>This metric &#8211; Installations per 100k Internet Users &#8211; seems like a reasonable way to compare the adoption of software between countries. &#8216;Internet Users&#8217;, by definition, have access to a computer (needed to run FOSS) and to the internet (needed to get FOSS). This metric is not skewed by the percentage of the population that are not internet users, and is not skewed by cost-of-living or exchange rates.</p>
<p>Here are the top 40 countries for new Pentaho installations per 100k internet users (for countries with over 1 million internet users).</p>
<p><a href="http://jamesdixon.files.wordpress.com/2010/11/top-40-installers-per-internet-users.png"><img class="aligncenter size-full wp-image-782" title="Top 40 Installers Per Internet Users" src="http://jamesdixon.files.wordpress.com/2010/11/top-40-installers-per-internet-users.png?w=700&#038;h=586" alt="" width="700" height="586" /></a></p>
<p>There is a bias still. Countries with a lower percentage of internet users in the total population will be rated higher than those with very high percentage. This is because in the first case, the individuals with internet access will tend to be those in business, i.e. those with a higher than normal need for BI tools. Whereas in the second case the internet users include relatively more families and individuals &#8211; those with a lower need for BI tools. This bias would not affect the installation figures of software such as Firefox, but would affect the ratings in Pentaho&#8217;s case.</p>
<p>If we group the countries into regions we see some other interesting things. This scatter chart shows the number of internet users on the X axis and new installations of Pentaho software on the Y axis.</p>
<p><a href="http://jamesdixon.files.wordpress.com/2010/11/internet-users-vs-installations.png"><img class="aligncenter" title="Internet Users vs Installations" src="http://jamesdixon.files.wordpress.com/2010/11/internet-users-vs-installations.png?w=700&#038;h=427" alt="" width="700" height="427" /></a></p>
<p>Interestingly the USA, South America, and Asia come out with around the same total number of installations (approx 30,000), but the chart shows a large difference (100m up to 550m) in the number of internet users within those regions. Europe, as a region, has the highest number of new installations, with a 50% margin over the second place region.</p>
<p>So which metric do you think is most valuable? And for what purpose?</p>
<p>Also interesting to note is that the 2010 installations numbers represent, for each country, 40-50% of the all-time (2007-2010) installation figures. This means that the number of new installations so far in 2010 is about the same as the number of installations in the previous 3 years combined.</p>
<h2>About This Analysis</h2>
<p>And yes, I used Pentaho software to do this analysis &#8211; I used Pentaho&#8217;s Agile BI process.</p>
<ul>
<li>Iteration 1: I first loaded the &#8216;new installations&#8217; data into a table to do the histograms and the first map. After seeing the map, it occurred to me that just looking at the installation figures was not very interesting, and that comparing installations to GDP might be better.</li>
<li>Iteration 2: So I went to find GDP data and added it to the table using Pentaho Data Integration. After seeing the &#8216;Pentaho Installs Per $Bn GDP&#8217;  map it occurred to me that other metrics might show different, and better, results &#8211; so I went to find other data sets, not knowing what I might find.</li>
<li>Iteration 3: At the CIA World Factbook I found Labor Force and Internet Users. I added these to the table and looked at the maps. At this point I decided that comparing installation counts with the total number of internet users in a country was a good metric.</li>
</ul>
<p>It took three iterations of finding data, merge/calculate/load, and visualization before I settled on an analysis I thought was optimal. The important point here is that until I saw the data visualized, the next question did not occur to me, so a one-pass &#8216;requirements&#8217; -&gt; &#8216;design&#8217; -&gt; &#8216;implement&#8217; -&gt; &#8216;visualize&#8217; process would not have worked.</p>
<br />  <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gocomments/jamesdixon.wordpress.com/770/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/comments/jamesdixon.wordpress.com/770/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godelicious/jamesdixon.wordpress.com/770/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/delicious/jamesdixon.wordpress.com/770/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gofacebook/jamesdixon.wordpress.com/770/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/facebook/jamesdixon.wordpress.com/770/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gotwitter/jamesdixon.wordpress.com/770/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/twitter/jamesdixon.wordpress.com/770/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gostumble/jamesdixon.wordpress.com/770/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/stumble/jamesdixon.wordpress.com/770/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godigg/jamesdixon.wordpress.com/770/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/digg/jamesdixon.wordpress.com/770/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/goreddit/jamesdixon.wordpress.com/770/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/reddit/jamesdixon.wordpress.com/770/" /></a> <img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=jamesdixon.wordpress.com&amp;blog=3802959&amp;post=770&amp;subd=jamesdixon&amp;ref=&amp;feed=1" width="1" height="1" />]]></content:encoded>
			<wfw:commentRss>http://jamesdixon.wordpress.com/2010/11/15/150000-installations-year-to-date-for-pentaho/feed/</wfw:commentRss>
		<slash:comments>7</slash:comments>
	
		<media:content url="" medium="image">
			<media:title type="html">jimmyed2000</media:title>
		</media:content>

		<media:content url="http://jamesdixon.files.wordpress.com/2010/11/new-pentaho-installs-long-tail.png" medium="image">
			<media:title type="html">New Pentaho Installs Long Tail</media:title>
		</media:content>

		<media:content url="http://jamesdixon.files.wordpress.com/2010/11/new-pentaho-installs-long-tail-log.png" medium="image">
			<media:title type="html">New Pentaho Installs Long Tail Log</media:title>
		</media:content>

		<media:content url="http://jamesdixon.files.wordpress.com/2010/11/new-pentaho-installs.png" medium="image">
			<media:title type="html">New Pentaho Installs</media:title>
		</media:content>

		<media:content url="http://jamesdixon.files.wordpress.com/2010/11/new-pentaho-installs-per-gdp.png" medium="image">
			<media:title type="html">New Pentaho Installs per billion $ GDP</media:title>
		</media:content>

		<media:content url="http://jamesdixon.files.wordpress.com/2010/11/new-pentaho-installs-per-labor.png" medium="image">
			<media:title type="html">New Pentaho Installs per 100k Labor Force</media:title>
		</media:content>

		<media:content url="http://jamesdixon.files.wordpress.com/2010/11/new-pentaho-installs-per-internet-users.png" medium="image">
			<media:title type="html">New Pentaho Installs per Internet Users</media:title>
		</media:content>

		<media:content url="http://jamesdixon.files.wordpress.com/2010/11/top-40-installers-per-internet-users.png" medium="image">
			<media:title type="html">Top 40 Installers Per Internet Users</media:title>
		</media:content>

		<media:content url="http://jamesdixon.files.wordpress.com/2010/11/internet-users-vs-installations.png" medium="image">
			<media:title type="html">Internet Users vs Installations</media:title>
		</media:content>
	</item>
		<item>
		<title>Data Quality Issue Sparks Invasion of Costa Rica</title>
		<link>http://jamesdixon.wordpress.com/2010/11/07/data-quality-issue-sparks-invasion-of-costa-rica/</link>
		<comments>http://jamesdixon.wordpress.com/2010/11/07/data-quality-issue-sparks-invasion-of-costa-rica/#comments</comments>
		<pubDate>Sun, 07 Nov 2010 03:37:44 +0000</pubDate>
		<dc:creator>James</dc:creator>
				<category><![CDATA[Business Intelligence]]></category>

		<guid isPermaLink="false">http://jamesdixon.wordpress.com/?p=768</guid>
		<description><![CDATA[When it comes to data, quality is king. Validating that the data is right is an important part of a BI project. Get the data wrong, and bad things can happen. For example: the State Department sends Google bad border data &#8211; and Costa Rica gets invaded. http://searchengineland.com/nicaragua-raids-costa-rica-blames-google-maps-54885 http://edition.cnn.com/2010/TECH/web/11/05/nicaragua.raid.google.maps/ That&#8217;s my new favorite data quality [...]<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=jamesdixon.wordpress.com&amp;blog=3802959&amp;post=768&amp;subd=jamesdixon&amp;ref=&amp;feed=1" width="1" height="1" />]]></description>
			<content:encoded><![CDATA[<p>When it comes to data, quality is king. Validating that the data is right is an important part of a BI project. Get the data wrong, and bad things can happen.</p>
<p>For example: the State Department sends Google bad border data &#8211; and Costa Rica gets invaded.</p>
<p><a href="http://searchengineland.com/nicaragua-raids-costa-rica-blames-google-maps-54885" target="_blank">http://searchengineland.com/nicaragua-raids-costa-rica-blames-google-maps-54885</a></p>
<p><a href="http://edition.cnn.com/2010/TECH/web/11/05/nicaragua.raid.google.maps/" target="_blank">http://edition.cnn.com/2010/TECH/web/11/05/nicaragua.raid.google.maps/</a></p>
<p>That&#8217;s my new favorite data quality anecdote.</p>
<br />  <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gocomments/jamesdixon.wordpress.com/768/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/comments/jamesdixon.wordpress.com/768/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godelicious/jamesdixon.wordpress.com/768/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/delicious/jamesdixon.wordpress.com/768/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gofacebook/jamesdixon.wordpress.com/768/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/facebook/jamesdixon.wordpress.com/768/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gotwitter/jamesdixon.wordpress.com/768/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/twitter/jamesdixon.wordpress.com/768/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gostumble/jamesdixon.wordpress.com/768/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/stumble/jamesdixon.wordpress.com/768/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godigg/jamesdixon.wordpress.com/768/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/digg/jamesdixon.wordpress.com/768/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/goreddit/jamesdixon.wordpress.com/768/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/reddit/jamesdixon.wordpress.com/768/" /></a> <img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=jamesdixon.wordpress.com&amp;blog=3802959&amp;post=768&amp;subd=jamesdixon&amp;ref=&amp;feed=1" width="1" height="1" />]]></content:encoded>
			<wfw:commentRss>http://jamesdixon.wordpress.com/2010/11/07/data-quality-issue-sparks-invasion-of-costa-rica/feed/</wfw:commentRss>
		<slash:comments>0</slash:comments>
	
		<media:content url="" medium="image">
			<media:title type="html">jimmyed2000</media:title>
		</media:content>
	</item>
		<item>
		<title>SalesForce needs a good CRM system</title>
		<link>http://jamesdixon.wordpress.com/2010/11/05/salesforce-needs-a-good-crm-system/</link>
		<comments>http://jamesdixon.wordpress.com/2010/11/05/salesforce-needs-a-good-crm-system/#comments</comments>
		<pubDate>Fri, 05 Nov 2010 23:30:13 +0000</pubDate>
		<dc:creator>James</dc:creator>
				<category><![CDATA[Uncategorized]]></category>

		<guid isPermaLink="false">http://jamesdixon.wordpress.com/?p=766</guid>
		<description><![CDATA[Today I received some sales spam from SalesForce.com. Nothing unusual about that except that we are a customer of SalesForce.com. It&#8217;s not a good demonstration of their product capabilities if the king of SaaS Customer Relationship Management can&#8217;t internally identify who their customers are. #Fail SalesForce needs a better CRM system. Any suggestions?<img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=jamesdixon.wordpress.com&amp;blog=3802959&amp;post=766&amp;subd=jamesdixon&amp;ref=&amp;feed=1" width="1" height="1" />]]></description>
			<content:encoded><![CDATA[<p>Today I received some sales spam from SalesForce.com. Nothing unusual about that except that we are a customer of SalesForce.com.</p>
<p>It&#8217;s not a good demonstration of their product capabilities if the king of SaaS Customer Relationship Management can&#8217;t internally identify who their customers are. #Fail</p>
<p>SalesForce needs a better CRM system. Any suggestions?</p>
<br />  <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gocomments/jamesdixon.wordpress.com/766/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/comments/jamesdixon.wordpress.com/766/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godelicious/jamesdixon.wordpress.com/766/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/delicious/jamesdixon.wordpress.com/766/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gofacebook/jamesdixon.wordpress.com/766/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/facebook/jamesdixon.wordpress.com/766/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gotwitter/jamesdixon.wordpress.com/766/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/twitter/jamesdixon.wordpress.com/766/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/gostumble/jamesdixon.wordpress.com/766/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/stumble/jamesdixon.wordpress.com/766/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/godigg/jamesdixon.wordpress.com/766/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/digg/jamesdixon.wordpress.com/766/" /></a> <a rel="nofollow" href="http://feeds.wordpress.com/1.0/goreddit/jamesdixon.wordpress.com/766/"><img alt="" border="0" src="http://feeds.wordpress.com/1.0/reddit/jamesdixon.wordpress.com/766/" /></a> <img alt="" border="0" src="http://stats.wordpress.com/b.gif?host=jamesdixon.wordpress.com&amp;blog=3802959&amp;post=766&amp;subd=jamesdixon&amp;ref=&amp;feed=1" width="1" height="1" />]]></content:encoded>
			<wfw:commentRss>http://jamesdixon.wordpress.com/2010/11/05/salesforce-needs-a-good-crm-system/feed/</wfw:commentRss>
		<slash:comments>3</slash:comments>
	
		<media:content url="" medium="image">
			<media:title type="html">jimmyed2000</media:title>
		</media:content>
	</item>
	</channel>
</rss>
