<?xml version="1.0" encoding="UTF-8"?>
<?xml-stylesheet type="text/xsl" media="screen" href="/~d/styles/atom10full.xsl"?><?xml-stylesheet type="text/css" media="screen" href="http://feeds.feedburner.com/~d/styles/itemcontent.css"?><feed xmlns="http://www.w3.org/2005/Atom" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:thr="http://purl.org/syndication/thread/1.0" xmlns:feedburner="http://rssnamespace.org/feedburner/ext/1.0">
    <title>Tony Bain</title>
    
    <link rel="alternate" type="text/html" href="http://blog.tonybain.com/tony_bain/" />
    <id>tag:typepad.com,2003:weblog-140947</id>
    <updated>2009-11-10T18:03:25+11:00</updated>
    <subtitle>Innovations in Data Management</subtitle>
    <generator uri="http://www.typepad.com/">TypePad</generator>
    <link rel="self" href="http://feeds.feedburner.com/TonyBain" type="application/atom+xml" /><feedburner:emailServiceId>TonyBain</feedburner:emailServiceId><feedburner:feedburnerHostname>http://feedburner.google.com</feedburner:feedburnerHostname><feedburner:browserFriendly>This is an XML content feed. It is intended to be viewed in a newsreader or syndicated to another site, subject to copyright and fair use.</feedburner:browserFriendly><atom10:link xmlns:atom10="http://www.w3.org/2005/Atom" rel="hub" href="http://pubsubhubbub.appspot.com" /><entry>
        <title>Back from Blogging Hiatus - Update 3</title>
        <link rel="alternate" type="text/html" href="http://blog.tonybain.com/tony_bain/2009/11/back-from-blogging-hiatus-update-3.html" />
        <link rel="replies" type="text/html" href="http://blog.tonybain.com/tony_bain/2009/11/back-from-blogging-hiatus-update-3.html" thr:count="0" />
        <id>tag:typepad.com,2003:post-6a00d834559d1e69e20120a66d03f3970b</id>
        <published>2009-11-10T18:03:25+11:00</published>
        <updated>2009-11-10T18:25:41+11:00</updated>
        <summary>Image by Nathan Lanier via Flickr &lt;&lt; Back from Blogging Hiatus - Update 2 IngresNo specific announcements from Ingres other than I think the VectorWise stuff is progressing well. To me Ingres is a bit of a dark horse. They...</summary>
        <author>
            <name>Tony Bain</name>
        </author>
        <category scheme="http://www.sixapart.com/ns/types#category" term="Business Intelligence" />
        <category scheme="http://www.sixapart.com/ns/types#category" term="Cloud Databases" />
        <category scheme="http://www.sixapart.com/ns/types#category" term="Data Integration" />
        <category scheme="http://www.sixapart.com/ns/types#category" term="Database Management" />
        <category scheme="http://www.sixapart.com/ns/types#category" term="Microsoft SQL Server" />
        <category scheme="http://www.sixapart.com/ns/types#category" term="MySQL" />
        <category scheme="http://www.sixapart.com/ns/types#category" term="NoSQL" />
        <category scheme="http://www.sixapart.com/ns/types#category" term="Oracle" />
        <category scheme="http://www.sixapart.com/ns/types#category" term="Relational DB" />
        <category scheme="http://www.sixapart.com/ns/types#category" term="Web 2.0" />
        <category scheme="http://www.sixapart.com/ns/types#category" term="Web/Tech" />
        
        <category scheme="http://sixapart.com/ns/types#tag" term="Database" />
        <category scheme="http://sixapart.com/ns/types#tag" term="Database management system" />
        <category scheme="http://sixapart.com/ns/types#tag" term="IBM" />
        <category scheme="http://sixapart.com/ns/types#tag" term="IBM DB2" />
        <category scheme="http://sixapart.com/ns/types#tag" term="MySQL" />
        <category scheme="http://sixapart.com/ns/types#tag" term="Open source" />
        <category scheme="http://sixapart.com/ns/types#tag" term="RDBMS" />
        <category scheme="http://sixapart.com/ns/types#tag" term="Relational database management system" />
        
<content type="html" xml:lang="en-AU" xml:base="http://blog.tonybain.com/tony_bain/">&lt;div xmlns="http://www.w3.org/1999/xhtml"&gt;&lt;p class="zemanta-img" style="margin: 1em; float: right; display: block; width: 250px;"&gt;&lt;a href="http://www.flickr.com/photos/31120344@N03/4091328042/"&gt;&lt;img alt="Boston (Photogra)phy Party" src="http://farm3.static.flickr.com/2533/4091328042_962eab01c2_m.jpg" style="border: medium none ; display: block;"&gt;&lt;/img&gt;&lt;/a&gt;&lt;span class="zemanta-img-attribution"&gt;Image by &lt;a href="http://www.flickr.com/photos/31120344@N03/4091328042/"&gt;Nathan Lanier&lt;/a&gt; via Flickr&lt;/span&gt;&lt;/p&gt;&lt;p&gt;&lt;a href="http://blog.tonybain.com/tony_bain/2009/11/back-from-hiatus-summary-update-2.html" target="_blank"&gt;&amp;lt;&amp;lt; Back from Blogging Hiatus - Update 2&lt;/a&gt;&lt;/p&gt;&lt;h2&gt;Ingres&lt;/h2&gt;No specific announcements from &lt;a href="http://www.ingres.com/" target="_blank"&gt;Ingres &lt;/a&gt;other than I think the &lt;a href="http://www.ingres.com/vectorwise/" target="_blank"&gt;VectorWise&lt;/a&gt; stuff is progressing well.&lt;br&gt;&lt;br&gt;To me Ingres is a bit of a dark horse.  They are open source and doing reasonable revenues.  And they are active in the enterprise market (something MySQL hasn’t really achieved).  But they remain largely off the radar in commentary surrounding the DBMS industry.&lt;br&gt;&lt;br&gt;My personal pick is this will start to change during the second half of next year.  Several things happening in the market (Oracle’s eventual acquisition of MySQL being a major one) and some things they have happening internally (VectorWise being a major one) I think will help to start to propel Ingres back into the RDBMS spotlight, especially in the enterprise.&lt;br&gt;&lt;br&gt;&lt;h2&gt;VoltDB&lt;/h2&gt;It sounds like &lt;a href="http://www.voltdb.com/" target="_blank"&gt;VoltDB &lt;/a&gt;is getting closer with some talk of being able to see an early version of the product soon.&lt;br&gt;&lt;br&gt;&lt;p&gt;VoltDB will be an interesting case to watch.  VoltDB (&lt;a href="http://www.vertica.com"&gt;Vertica&lt;/a&gt;’s “sister”) is a lightweight DBMS optimized for large scale transaction processing.  I don’t know which bits of the architecture they are ok for people to talk about yet so I won’t go into detail on that.  But regardless of the technology, VoltDB should be watched because of their transaction processing focus.  Many analytics DBMS vendors have entered the market over the last few years, but few transaction processing alternatives have set up shop recently.  This is for a few reasons, one major on being the transaction processing market is such a tough nut to crack.&lt;/p&gt;&lt;p&gt;It sounds as if VoltDB has been bootstrapped with funding help coming from a company who is involved in the stock market.   Certain areas of FSI obviously have “niche’s” that require high end distributed transaction processing, which is precisely where I am sure they will find their early traction.  But what will be interesting is if they can break out of this niche and start to engage the wider ISV community.  The go to market will be much different and much more difficult than what they have seen with Vertica.  But will luminaries like &lt;a href="http://en.wikipedia.org/wiki/Michael_Stonebraker" target="_blank"&gt;Stonebraker &lt;/a&gt;leading the way, who knows they may make a dent.&lt;/p&gt;&lt;em&gt;They funny thing with Michael Stonebraker is most of the companies or institutions he is involved with that I speak to, say that he is spending most of his time on "their" project.  I am actually starting to doubt there is one Michael Stonebraker and suspect cloning may somehow be involved…&lt;/em&gt;&lt;br&gt;&lt;br&gt;&lt;h2&gt;IBM DB2&lt;/h2&gt;I spoke to IBM a few weeks back when they announced their &lt;a href="http://www-01.ibm.com/software/data/db2/9/editions-features-purescale.html" target="_blank"&gt;DB2 PureScale&lt;/a&gt; technology.  PureScale is actually quite exciting.  But they chose to announce it around the time of Oracle OpenWorld and press attention was largely drowned out but, among other things, Larry’s persistent bagging of IBM.&lt;br&gt;&lt;br&gt;IBM DB2 PureScale is a technology solution which provides shared-disk clustering for DB2 on IBM Power Systems.  New nodes can be added online (a traditional problem for shared disk clustering), and node failures will not see new requests fail as they will be transparently routed to other available nodes (although I believe in progress transactions will fail).  This is done using the hardware architecture of the Power Systems, and also done in a way that doesn’t require any application code changes.&lt;br&gt;&lt;br&gt;&lt;p&gt;However, on a different note, is it seems part of IBM’s strategy for gaining customers from Oracle is to &lt;a href="http://db2news.wordpress.com/2009/09/15/plsql-support-in-db2/" target="_blank"&gt;make DB2 more compatible with Oracle&lt;/a&gt;.  They say imitation is the greatest form of flattery so I am not sure if IBM is paying Oracle a huge compliment here?  But more seriously, my concern about this strategy is I believe Oracle is very much in aware of, and in control of, their wins &amp;amp; losses and can put in preventative measures when they so desire to block any major hemorrhaging.  IBM, I don't think you want to put too much focus on chasing Oracle's cast offs.  DB2 is also good in it's own right and you need to do a better job of showcasing the platform to ISV's if you want to retain your pride of place.&lt;/p&gt;&lt;p&gt;Although, at least this may allow ISV’s to more easily support DB2 alongside Oracle. &lt;/p&gt;&lt;p&gt;&lt;/p&gt;&lt;h2&gt;XtremeData&lt;/h2&gt;&lt;a href="http://www.xtremedata.com/" target="_blank"&gt;XtremeData &lt;/a&gt;is yet another vendor to enter the MPP analytics space.  XtremeData is worthy of note because their product is built upon their unique FPGA.  Unlike other FPGA’s I have seen, I understand that theirs plugs into a spare CPU socket in the server.  The FPGA can then provide pushed down data streaming operations on data at rates available to the CPU bus (instead of the PCI bus other some other FPGA approaches use).  Although I haven’t seen any benchmark data yet for what this translates into.&lt;br&gt;&lt;br&gt;When I spoke to XtremeData their focus seemed to be very much on the very high end.  Large deployments of many nodes, in many racks, handling many hundreds of TB (or PB).  As I have spoken about before, the MPP space is very busy right now.  Most of the companies are naturally focusing on the mid-range MPP needs, so maybe focusing on the very large end is a smart way to differentiate.  This of course may change as they ramp up and I will be curious to see if there actually is a sustainable market at this very top end.&lt;br&gt;&lt;br&gt;&lt;h2&gt;NoSQL&lt;/h2&gt;There has been a lot happening in the NoSQL technologies (Mongo, Cassandra, Voldemort etc) which I will comment on in other posts.  But an annoying thing, which can sometimes happen with community open source initiatives, is the level of infighting and bickering has been rising steadily.  And this is not even on important technological decisions.  An example, a lot of the bandwidth of the NOSQL mailing list is debating what to call themselves (which degraded into personal attacks and name calling at one point).  NoSQL vs many other things, and even what the definition of NoSQL is.  This really highlights to me the importance of the commercialized organizations surrounding this technology to keeping providing the necessary beacons to focus on and more this initiative forward.&lt;br&gt;&lt;br&gt;&#xD;
&#xD;
&lt;div class="zemanta-pixie" style="margin-top: 10px; height: 15px;"&gt;&lt;a class="zemanta-pixie-a" href="http://reblog.zemanta.com/zemified/69c56191-4a6a-4af3-8b47-1bfdb9a92b4f/" title="Reblog this post [with Zemanta]"&gt;&lt;img alt="Reblog this post [with Zemanta]" class="zemanta-pixie-img " src="http://img.zemanta.com/reblog_e.png?x-id=69c56191-4a6a-4af3-8b47-1bfdb9a92b4f" style="border: medium none ; float: right;"&gt;&lt;/img&gt;&lt;/a&gt;&lt;span class="zem-script more-related pretty-attribution"&gt;&lt;script src="http://static.zemanta.com/readside/loader.js" type="text/javascript"&gt;&lt;/script&gt;&lt;/span&gt;&lt;/div&gt;&lt;/div&gt;&lt;div class="feedflare"&gt;
&lt;a href="http://feeds.feedburner.com/~ff/TonyBain?a=mtEXW7Pm-Ow:bc3jjRBtZNU:yIl2AUoC8zA"&gt;&lt;img src="http://feeds.feedburner.com/~ff/TonyBain?d=yIl2AUoC8zA" border="0"&gt;&lt;/img&gt;&lt;/a&gt; &lt;a href="http://feeds.feedburner.com/~ff/TonyBain?a=mtEXW7Pm-Ow:bc3jjRBtZNU:F7zBnMyn0Lo"&gt;&lt;img src="http://feeds.feedburner.com/~ff/TonyBain?i=mtEXW7Pm-Ow:bc3jjRBtZNU:F7zBnMyn0Lo" border="0"&gt;&lt;/img&gt;&lt;/a&gt; &lt;a href="http://feeds.feedburner.com/~ff/TonyBain?a=mtEXW7Pm-Ow:bc3jjRBtZNU:V_sGLiPBpWU"&gt;&lt;img src="http://feeds.feedburner.com/~ff/TonyBain?i=mtEXW7Pm-Ow:bc3jjRBtZNU:V_sGLiPBpWU" border="0"&gt;&lt;/img&gt;&lt;/a&gt;
&lt;/div&gt;&lt;img src="http://feeds.feedburner.com/~r/TonyBain/~4/mtEXW7Pm-Ow" height="1" width="1"/&gt;</content>


    </entry>
    <entry>
        <title>Back from Hiatus - Summary Update 2</title>
        <link rel="alternate" type="text/html" href="http://blog.tonybain.com/tony_bain/2009/11/back-from-hiatus-summary-update-2.html" />
        <link rel="replies" type="text/html" href="http://blog.tonybain.com/tony_bain/2009/11/back-from-hiatus-summary-update-2.html" thr:count="0" />
        <id>tag:typepad.com,2003:post-6a00d834559d1e69e20120a6afa153970c</id>
        <published>2009-11-06T15:03:22+11:00</published>
        <updated>2009-11-06T15:03:22+11:00</updated>
        <summary>Back from Hiatus - Summary Update 1 GoodDataGoodData has launched and they are providing a cloud based analytics platform for use in integration with online apps. Starting with some initial focus on SalesForce data, but working hard on expanding the...</summary>
        <author>
            <name>Tony Bain</name>
        </author>
        <category scheme="http://www.sixapart.com/ns/types#category" term="Business Intelligence" />
        <category scheme="http://www.sixapart.com/ns/types#category" term="Cloud Databases" />
        <category scheme="http://www.sixapart.com/ns/types#category" term="Data Integration" />
        <category scheme="http://www.sixapart.com/ns/types#category" term="Database Management" />
        <category scheme="http://www.sixapart.com/ns/types#category" term="Microsoft SQL Server" />
        <category scheme="http://www.sixapart.com/ns/types#category" term="MySQL" />
        <category scheme="http://www.sixapart.com/ns/types#category" term="NoSQL" />
        <category scheme="http://www.sixapart.com/ns/types#category" term="Relational DB" />
        <category scheme="http://www.sixapart.com/ns/types#category" term="Web 2.0" />
        <category scheme="http://www.sixapart.com/ns/types#category" term="Web/Tech" />
        
        <category scheme="http://sixapart.com/ns/types#tag" term="GoodData" />
        <category scheme="http://sixapart.com/ns/types#tag" term="Infobright" />
        <category scheme="http://sixapart.com/ns/types#tag" term="Kognitio" />
        <category scheme="http://sixapart.com/ns/types#tag" term="Mark Logic" />
        
<content type="html" xml:lang="en-AU" xml:base="http://blog.tonybain.com/tony_bain/">&lt;p&gt;&lt;em&gt;&lt;a href="http://blog.tonybain.com/tony_bain/2009/11/back-from-hiatus-summary-update-1.html"&gt;Back from Hiatus - Summary Update 1&lt;/a&gt;&lt;br&gt;&lt;/em&gt;&lt;/p&gt;&lt;h2&gt;GoodData&lt;/h2&gt;&lt;a href="http://www.gooddata.com/" target="_blank"&gt;GoodData &lt;/a&gt;has launched and they are providing a cloud based analytics platform for use in integration with online apps.  Starting with some initial focus on SalesForce data, but working hard on expanding the list of ISV’s who choose to provide their customers analytics via GoodData.&lt;br&gt;&lt;br&gt;GoodData was started by “good guy” Czech serial entrepreneur &lt;a href="http://twitter.com/RomanStanek" target="_blank"&gt;Roman Stanek&lt;/a&gt; (NetBeans) and has just raised funds from Andressen Horowitz and appointed Time O’Reilly to the board.  GoodData is interesting because it is simple, accessible and available on demand.  Still early days but think Roman is on to another winner here.  Certainly recommend any ISV building cloud based apps to look at their platform.&lt;br&gt;&lt;br&gt;&lt;h2&gt;Mark Logic&lt;/h2&gt;I was keen to learn more about &lt;a href="http://www.marklogic.com/" target="_blank"&gt;Mark Logic&lt;/a&gt; as I didn’t understand their products in any detail.  David and Ron were more than obliging and I sat down with them last week for a run though.&lt;br&gt;&lt;br&gt;In short, I am impressed by the technology of Mark Logic.  It is a database that uses XML as the schema data model and XQuery as the primary query language.  But it is far more than and XML extension bolted on top of a traditional db engine (such as some of the XML capabilities in the more traditional RBDMS vendors).  Internally Mark Logic has all the important DBMS components but they are designed and optimized around the XML schema (query processor, indexing etc) from the ground up.  I also understand they have distributed multi-node capability, something which is still quite rare over in the general purpose RBDMS world. &lt;br&gt;&lt;br&gt;Mark Logic has a history in the content publishing market, as you would expect, because much “published” data is naturally represented in XML.  I did sense the team at Mark Logic is keen to break away from this niche a little (while at the same time respecting that this will likely remain their primary market).  Exactly how they go about this isn’t entirely clear to me as the world has kind of moved on from the “XML for everything” excitement that existed in the early 2000’s.  There will be plenty of case-by-case requirements, but a piecemeal market is hard to drive business development.  But publishing remains a clear staple and I am sure they can leverage this into a few more.&lt;br&gt;&lt;br&gt;I did get somewhat excited when we were talking about serializing JSON in and out of Mark Logic.  This is very topical in the web app market as we see a push towards client based web applications and web service dishing up JSON.  But this is not necessarily a money spinner as there are “free” offerings servicing this need already (CouchDB, MongoDB etc).  I understand Mark Logic is proprietary license so it might be hard to gain traction here.&lt;br&gt;&lt;br&gt;&lt;h2&gt;Kognitio&lt;/h2&gt;I spoke briefly with &lt;a href="http://www.kognitio.com/" target="_blank"&gt;Kognitio&lt;/a&gt; a couple of weeks back.  I hear very little about Kognitio so I was keen to speak to them about their progress.  Kognitio is a UK based company and provides a data warehouse appliance, while only launching in the US last year they have a much longer history in the UK.&lt;br&gt;&lt;br&gt;Kognitio seems to be taking an alternative approach to achieving growth than the one many of the US vendors are using.  While most of the US companies are venture backed and are pushing hard to gain market share, Kognitio on the other hand is privately backed and seems to be taking a slower and more methodical approach.  This has obviously served them well in the UK but it will be interesting how that plays out into the highly crowed, highly competitive US data warehousing scene.  It may turn out to be a true test to see who really does win out of the tortoise and the hare.&lt;br&gt;&lt;br&gt;&lt;h2&gt;Infobright&lt;/h2&gt;The big news at &lt;a href="http://www.infobright.com" target="_blank"&gt;Infobright &lt;/a&gt;is that Miriam is no longer CEO and she has been replaced by a temporary CEO, board member Mark Burton.  I spoke with Mark a couple of days ago and the reasons cited were around future direction and the next stage in the company’s lifecycle etc.  They are still sorting this all out and expect to be ready to start discussing their new direction in a few weeks.  In saying that, when we spoke I got the feeling their positioning will still very tied to the MySQL customer base, something I tend to disagree with.  But it would be premature to speculate and instead will wait to further information is available.&lt;br&gt;&lt;div class="feedflare"&gt;
&lt;a href="http://feeds.feedburner.com/~ff/TonyBain?a=zr9OC2MfnRk:vEBb-bO40SI:yIl2AUoC8zA"&gt;&lt;img src="http://feeds.feedburner.com/~ff/TonyBain?d=yIl2AUoC8zA" border="0"&gt;&lt;/img&gt;&lt;/a&gt; &lt;a href="http://feeds.feedburner.com/~ff/TonyBain?a=zr9OC2MfnRk:vEBb-bO40SI:F7zBnMyn0Lo"&gt;&lt;img src="http://feeds.feedburner.com/~ff/TonyBain?i=zr9OC2MfnRk:vEBb-bO40SI:F7zBnMyn0Lo" border="0"&gt;&lt;/img&gt;&lt;/a&gt; &lt;a href="http://feeds.feedburner.com/~ff/TonyBain?a=zr9OC2MfnRk:vEBb-bO40SI:V_sGLiPBpWU"&gt;&lt;img src="http://feeds.feedburner.com/~ff/TonyBain?i=zr9OC2MfnRk:vEBb-bO40SI:V_sGLiPBpWU" border="0"&gt;&lt;/img&gt;&lt;/a&gt;
&lt;/div&gt;&lt;img src="http://feeds.feedburner.com/~r/TonyBain/~4/zr9OC2MfnRk" height="1" width="1"/&gt;</content>


    </entry>
    <entry>
        <title>The Danger of blocking the Oracle/Sun deal</title>
        <link rel="alternate" type="text/html" href="http://blog.tonybain.com/tony_bain/2009/11/image-via-wikipediafyi---the-thoughts-here-have-been-gathered-from-conversations-with-several-individuals-including-an-inter.html" />
        <link rel="replies" type="text/html" href="http://blog.tonybain.com/tony_bain/2009/11/image-via-wikipediafyi---the-thoughts-here-have-been-gathered-from-conversations-with-several-individuals-including-an-inter.html" thr:count="0" />
        <id>tag:typepad.com,2003:post-6a00d834559d1e69e20120a6584b8d970b</id>
        <published>2009-11-06T10:29:52+11:00</published>
        <updated>2009-11-06T14:24:14+11:00</updated>
        <summary>Image via WikipediaFYI - the thoughts here have been gathered from conversations with several individuals, including an interesting conversation yesterday. As these conversations were off the record I won’t name names here but thanks to those people. I love open...</summary>
        <author>
            <name>Tony Bain</name>
        </author>
        <category scheme="http://www.sixapart.com/ns/types#category" term="Business Intelligence" />
        <category scheme="http://www.sixapart.com/ns/types#category" term="Cloud Databases" />
        <category scheme="http://www.sixapart.com/ns/types#category" term="Database Management" />
        <category scheme="http://www.sixapart.com/ns/types#category" term="Microsoft SQL Server" />
        <category scheme="http://www.sixapart.com/ns/types#category" term="MySQL" />
        <category scheme="http://www.sixapart.com/ns/types#category" term="NoSQL" />
        <category scheme="http://www.sixapart.com/ns/types#category" term="Oracle" />
        <category scheme="http://www.sixapart.com/ns/types#category" term="Relational DB" />
        <category scheme="http://www.sixapart.com/ns/types#category" term="Web 2.0" />
        <category scheme="http://www.sixapart.com/ns/types#category" term="Web/Tech" />
        
        <category scheme="http://sixapart.com/ns/types#tag" term="EnterpriseDB" />
        <category scheme="http://sixapart.com/ns/types#tag" term="MySQL" />
        <category scheme="http://sixapart.com/ns/types#tag" term="Open source" />
        <category scheme="http://sixapart.com/ns/types#tag" term="Oracle" />
        <category scheme="http://sixapart.com/ns/types#tag" term="Sun Microsystems" />
        
<content type="html" xml:lang="en-AU" xml:base="http://blog.tonybain.com/tony_bain/">&lt;div xmlns="http://www.w3.org/1999/xhtml"&gt;&lt;p class="zemanta-img" style="margin: 1em; float: right; display: block; width: 310px;"&gt;&lt;a href="http://en.wikipedia.org/wiki/Image:Oracle_Corporation_HQ.jpg"&gt;&lt;img alt="Oracle headquarters" height="200" src="http://upload.wikimedia.org/wikipedia/en/thumb/9/9d/Oracle_Corporation_HQ.jpg/300px-Oracle_Corporation_HQ.jpg" style="border: medium none ; display: block;" width="300"&gt;&lt;/img&gt;&lt;/a&gt;&lt;span class="zemanta-img-attribution"&gt;Image via &lt;a href="http://en.wikipedia.org/wiki/Image:Oracle_Corporation_HQ.jpg"&gt;Wikipedia&lt;/a&gt;&lt;/span&gt;&lt;/p&gt;&lt;em&gt;&lt;span style="font-size: 10px;"&gt;FYI - the thoughts here have been gathered from conversations with several individuals, including an interesting conversation yesterday.  As these conversations were off the record I won’t name names here but thanks to those people.&lt;/span&gt;&lt;/em&gt;&lt;br&gt;&lt;br&gt;I love open source software and I am a big supporter of many companies that produce open source offerings.  Here I am not going to debate if Oracle acquiring MySQL will be better for MySQL or not as that has been done to death.  But I do think it is relevant to discuss the dangers of blocking a commercial vendor from acquiring a potentially competitive open source vendor.&lt;br&gt;&lt;br&gt;Many open source software initiatives are purely community backed and are constructed in an informal, ad-hoc manner.  Many other initiatives are started within large new generation companies to serve their own needs, and then made available for the benefit of the community at large as a side benefit.&lt;br&gt;&lt;br&gt;This way of building software however limits the audience to users who have the necessary technical capability to build, deploy and support that software internally without a dependency on another supporting body (other than the community of course).  To open the software up as an option to a much wider customer base a more formal structure is required.  Typically a company is formed to develop, document, support, promote and rally the community and allow the software to be used in a much greater capacity.&lt;br&gt;&lt;br&gt;But without large license sales bootstrapping an open source company is very difficult.  Instead open source companies often use venture finance as a means of resourcing the company, to grow both the company and the software to some form of critical mass.  In the database world off the top of my head I can think of a bunch of open source companies who have taken this approach (MySQL prior to Sun, &lt;a class="zem_slink" href="http://www.10gen.com/" rel="homepage" title="10gen"&gt;10gen&lt;/a&gt;, &lt;a class="zem_slink" href="http://www.infobright.com" rel="homepage" title="Infobright"&gt;Infobright&lt;/a&gt;, &lt;a class="zem_slink" href="http://www.enterprisedb.com/" rel="homepage" title="EnterpriseDB"&gt;EnterpriseDB&lt;/a&gt; and so on).  &lt;br&gt;&lt;br&gt;Venture finance firms invest to help create significant value, and then create an exit.  IPO’s are unlikely in the database industry in general right now, and less likely for open source database companies.  So the most likely exit is through acquisition.  The number of companies who have the size, ability, direction &amp;amp; motivation to acquire a highly successful venture back database start up (assuming under good exit conditions) I could probably count on my fingers &amp;amp; toes. &lt;br&gt;&lt;br&gt;As dramatic as it sounds, blocking a commercial vendor from acquiring and open source vendor because of product overlaps could have much future impact.  Start ups seeking funding to build any killer app that overlaps with commercial software (of course, not just DB) may find some resistance from investors due to the potential exit issues.  Of course protecting the consumer from anti-competitive behavior is a necessary evil, but we also have to ensure that the system that allows companies like MySQL to come into existence is also protected.&lt;br&gt;&lt;br&gt;&#xD;
&#xD;
&lt;div class="zemanta-pixie" style="margin-top: 10px; height: 15px;"&gt;&lt;a class="zemanta-pixie-a" href="http://reblog.zemanta.com/zemified/7919e15b-67ca-421d-adca-edaf4617a130/" title="Reblog this post [with Zemanta]"&gt;&lt;img alt="Reblog this post [with Zemanta]" class="zemanta-pixie-img " src="http://img.zemanta.com/reblog_e.png?x-id=7919e15b-67ca-421d-adca-edaf4617a130" style="border: medium none ; float: right;"&gt;&lt;/img&gt;&lt;/a&gt;&lt;span class="zem-script more-related pretty-attribution"&gt;&lt;script src="http://static.zemanta.com/readside/loader.js" type="text/javascript"&gt;&lt;/script&gt;&lt;/span&gt;&lt;/div&gt;&lt;/div&gt;&lt;div class="feedflare"&gt;
&lt;a href="http://feeds.feedburner.com/~ff/TonyBain?a=kAVhVLVwzpw:btLqMv8mn44:yIl2AUoC8zA"&gt;&lt;img src="http://feeds.feedburner.com/~ff/TonyBain?d=yIl2AUoC8zA" border="0"&gt;&lt;/img&gt;&lt;/a&gt; &lt;a href="http://feeds.feedburner.com/~ff/TonyBain?a=kAVhVLVwzpw:btLqMv8mn44:F7zBnMyn0Lo"&gt;&lt;img src="http://feeds.feedburner.com/~ff/TonyBain?i=kAVhVLVwzpw:btLqMv8mn44:F7zBnMyn0Lo" border="0"&gt;&lt;/img&gt;&lt;/a&gt; &lt;a href="http://feeds.feedburner.com/~ff/TonyBain?a=kAVhVLVwzpw:btLqMv8mn44:V_sGLiPBpWU"&gt;&lt;img src="http://feeds.feedburner.com/~ff/TonyBain?i=kAVhVLVwzpw:btLqMv8mn44:V_sGLiPBpWU" border="0"&gt;&lt;/img&gt;&lt;/a&gt;
&lt;/div&gt;&lt;img src="http://feeds.feedburner.com/~r/TonyBain/~4/kAVhVLVwzpw" height="1" width="1"/&gt;</content>


    </entry>
    <entry>
        <title>Back from Hiatus - Summary Update 1</title>
        <link rel="alternate" type="text/html" href="http://blog.tonybain.com/tony_bain/2009/11/back-from-hiatus-summary-update-1.html" />
        <link rel="replies" type="text/html" href="http://blog.tonybain.com/tony_bain/2009/11/back-from-hiatus-summary-update-1.html" thr:count="0" />
        <id>tag:typepad.com,2003:post-6a00d834559d1e69e20120a6579fd2970b</id>
        <published>2009-11-06T06:58:21+11:00</published>
        <updated>2009-11-06T15:50:55+11:00</updated>
        <summary>Here is a summary of the key discussions I have had over the last month. Keep in mind, I’m no analyst. This is largely opinion based on various conversations I have had with the relevant companies (for analyst insight see...</summary>
        <author>
            <name>Tony Bain</name>
        </author>
        <category scheme="http://www.sixapart.com/ns/types#category" term="Business Intelligence" />
        <category scheme="http://www.sixapart.com/ns/types#category" term="Cloud Databases" />
        <category scheme="http://www.sixapart.com/ns/types#category" term="Data Integration" />
        <category scheme="http://www.sixapart.com/ns/types#category" term="Database Management" />
        <category scheme="http://www.sixapart.com/ns/types#category" term="Microsoft SQL Server" />
        <category scheme="http://www.sixapart.com/ns/types#category" term="MySQL" />
        <category scheme="http://www.sixapart.com/ns/types#category" term="Oracle" />
        <category scheme="http://www.sixapart.com/ns/types#category" term="Relational DB" />
        <category scheme="http://www.sixapart.com/ns/types#category" term="Web 2.0" />
        
        <category scheme="http://sixapart.com/ns/types#tag" term="Aster Data" />
        <category scheme="http://sixapart.com/ns/types#tag" term="Column-oriented DBMS" />
        <category scheme="http://sixapart.com/ns/types#tag" term="Greenplum" />
        <category scheme="http://sixapart.com/ns/types#tag" term="Kickfire" />
        <category scheme="http://sixapart.com/ns/types#tag" term="MySQL" />
        <category scheme="http://sixapart.com/ns/types#tag" term="RDBMS" />
        
<content type="html" xml:lang="en-AU" xml:base="http://blog.tonybain.com/tony_bain/">&lt;div xmlns="http://www.w3.org/1999/xhtml"&gt;Here is a summary of the key discussions I have had over the last month.  Keep in mind, I’m no analyst.  This is largely opinion based on various conversations I have had with the relevant companies (for analyst insight see &lt;a href="http://www.dbms2.com/" target="_blank"&gt;Curt Monash&lt;/a&gt;).&lt;br&gt;&lt;br&gt;&lt;h2&gt;KickFire&lt;/h2&gt;I think Kickfire has been doing it a little tough lately.  The difficulties in a startup launching a hardware appliance (and associated logistics) combined with being too focused on the MySQL customer base has impacted the growth of this interesting start up.  But they aren’t taking it lying down and have adjusted the strategy and have &lt;a href="http://www.kickfire.com/images/press_releases/Kickfire_3000_Series_Product_Release.pdf" target="_blank"&gt;added a new appliance to the range&lt;/a&gt;.  Kickfire now seems to have a stronger focus on &lt;a href="http://www.kickfire.com/blog/?p=469"&gt;the enterprise&lt;/a&gt; and has released a larger version of its appliance to provide a growth path.  As I have said all along, the MySQL aspect of their product is interesting but the solution as a whole is much more interesting and has much broader appeal than just the current MySQL customer base.&lt;br&gt;&lt;br&gt;Flipping hardware appliances is a much tougher play than software only solutions, partly due to it being much more difficult for customers to get their hands on your stuff and have a play before they buy.  Hopefully Kickfire has mitigated most of these issues now though their online, on demand evaluation host.  I haven’t yet played with this but it is on my list of things to do over the coming month.&lt;br&gt;&lt;br&gt;Kickfire’s enterprise strategy is just one of many that will be re-enforced by an Oracle acquisition of Sun.&lt;br&gt;&lt;br&gt;&lt;h2&gt;Greenplum&lt;/h2&gt;Greenplum has addressed a perceived chink in its amour with the release of its &lt;a href="http://www.greenplum.com/news/248/231/Beyond-Rows-and-Columns-Greenplum-s-Polymorphic-Data-Storage----Part-1/d,blog/" target="_blank"&gt;column store capability&lt;/a&gt;.  Greenplum has taken the popular hybrid approach which means on a case by case basis you can decide if a particular table should be row or column orientated.  But as &lt;a href="http://dbmsmusings.blogspot.com/2009/10/greenplum-announces-column-oriented.html" target="_blank"&gt;Daniel points out&lt;/a&gt;, it is a storage level only solution.  The storage only approach brings just part of the benefit of columnar stores, to achieve the full benefit the query execution engine needs to be aware of this layout (so features such as lightweight compression can be effectively used).  But I am sure this is an area where Greenplum will make further improvements in the future.&lt;br&gt;&lt;br&gt;&lt;h2&gt;Groovy&lt;/h2&gt;Groovy has been working hard carving out its niche in the real time web data market.  If you don’t recall, Groovy makes an in-memory RDBMS that has been extended to provide real time data streaming capabilities.  Groovy has been positioning this into the large web properties who are working on creating new large scale, real time applications for their user base.&lt;br&gt;&lt;br&gt;&lt;h2&gt;Aster Data&lt;/h2&gt;Aster has put out a number of announcements over the last month and I am trying to keep up.  Firstly they announced their tight integration with Hadoop.  This integration with Hadoop is map-reduce on the outside of the Aster Data platform (which apparently they didn’t have already although I think everyone assumed they did given their strong in database map-reduce message).  Aster has been banging the map-reduce drum for some time and is clearly the point of difference they are focusing on.  &lt;br&gt;&lt;br&gt;Aster has also release version 4.0 of their platform a couple of days ago, then a few days ago I was a bit surprised to see an email from them referring to their platform as “&lt;a href="http://www.asterdata.com/news/091102-Aster-Data-4.0-Massively-Parallel-Data-Application-Server.php" target="_blank"&gt;the World's First Massively Parallel Data-Application Server&lt;/a&gt;”.  This seems to be a new name reference to the in database map-reduce stuff, maybe as an effort to differentiate themselves from the myriad of competitors in this space they are trying to carve out a new category all for themselves.  For me, the external map-reduce stuff makes sense as I can see this&#xD;
being useful for data preparation on the way in to Aster and data&#xD;
dissemination of data on its way out of Aster.  But I still don’t have&#xD;
in my head clear examples when their in database map-reduce stuff is&#xD;
useful.  I am sure it is but I have a feeling it is valuable on a case&#xD;
by case basis which is difficult to articulate especially as a point of&#xD;
difference message.  But I missed Curt’s map-reduce webinar (at the&#xD;
last minute) so maybe that would have shed some light.  Anyway, they are running a webinar on this which you can &lt;a href="http://www.asterdata.com/wp_Aster_Data_4.0_Applications_Within/" target="_blank"&gt;register for here&lt;/a&gt;.&lt;br&gt;&lt;br&gt;&lt;p&gt;To me, Aster is more aggressively driving their platform into green fields trying to leverage their technology to find new customers and new markets.  Greenplum on the other hand is more ‘steady as she goes’, focusing on a more traditional and conservative enterprise data warehousing market (while still innovating ahead of the general purpose behemoth's).  The risks are on both sides.  When trying to define a new market you risk not finding one or finding one that is too small or “niche” to support your business.  With the conservative approach you risk being lumped in with everyone else, and in data warehousing ‘everyone else’ is now quite a long list.  &lt;/p&gt;&lt;p&gt;&lt;a href="http://blog.tonybain.com/tony_bain/2009/11/back-from-hiatus-summary-update-2.html"&gt;&amp;gt;&amp;gt; part 2 &lt;/a&gt;&lt;/p&gt;&#xD;
&#xD;
&lt;div class="zemanta-pixie" style="margin-top: 10px; height: 15px;"&gt;&lt;a class="zemanta-pixie-a" href="http://reblog.zemanta.com/zemified/5c1dac80-ac64-4f22-a3be-d94e71c3faaf/" title="Reblog this post [with Zemanta]"&gt;&lt;img alt="Reblog this post [with Zemanta]" class="zemanta-pixie-img " src="http://img.zemanta.com/reblog_e.png?x-id=5c1dac80-ac64-4f22-a3be-d94e71c3faaf" style="border: medium none ; float: right;"&gt;&lt;/img&gt;&lt;/a&gt;&lt;span class="zem-script more-related pretty-attribution"&gt;&lt;script src="http://static.zemanta.com/readside/loader.js" type="text/javascript"&gt;&lt;/script&gt;&lt;/span&gt;&lt;/div&gt;&lt;/div&gt;&lt;div class="feedflare"&gt;
&lt;a href="http://feeds.feedburner.com/~ff/TonyBain?a=5m-2xZi2TgM:Lar5llcEhVY:yIl2AUoC8zA"&gt;&lt;img src="http://feeds.feedburner.com/~ff/TonyBain?d=yIl2AUoC8zA" border="0"&gt;&lt;/img&gt;&lt;/a&gt; &lt;a href="http://feeds.feedburner.com/~ff/TonyBain?a=5m-2xZi2TgM:Lar5llcEhVY:F7zBnMyn0Lo"&gt;&lt;img src="http://feeds.feedburner.com/~ff/TonyBain?i=5m-2xZi2TgM:Lar5llcEhVY:F7zBnMyn0Lo" border="0"&gt;&lt;/img&gt;&lt;/a&gt; &lt;a href="http://feeds.feedburner.com/~ff/TonyBain?a=5m-2xZi2TgM:Lar5llcEhVY:V_sGLiPBpWU"&gt;&lt;img src="http://feeds.feedburner.com/~ff/TonyBain?i=5m-2xZi2TgM:Lar5llcEhVY:V_sGLiPBpWU" border="0"&gt;&lt;/img&gt;&lt;/a&gt;
&lt;/div&gt;&lt;img src="http://feeds.feedburner.com/~r/TonyBain/~4/5m-2xZi2TgM" height="1" width="1"/&gt;</content>


    </entry>
    <entry>
        <title>Blogging Hiatus</title>
        <link rel="alternate" type="text/html" href="http://blog.tonybain.com/tony_bain/2009/11/blogging-hiatus.html" />
        <link rel="replies" type="text/html" href="http://blog.tonybain.com/tony_bain/2009/11/blogging-hiatus.html" thr:count="0" />
        <id>tag:typepad.com,2003:post-6a00d834559d1e69e20120a6acc494970c</id>
        <published>2009-11-06T05:35:08+11:00</published>
        <updated>2009-11-06T05:35:08+11:00</updated>
        <summary>Image via WikipediaI have been on a bit of a blogging hiatus the last month. No specific reason for this other than being very busy and travelling a lot. During this time I have had a lot of interesting calls...</summary>
        <author>
            <name>Tony Bain</name>
        </author>
        
        
<content type="html" xml:lang="en-AU" xml:base="http://blog.tonybain.com/tony_bain/">&lt;div xmlns="http://www.w3.org/1999/xhtml"&gt;&lt;p class="zemanta-img" style="margin: 1em; float: right; display: block; width: 310px;"&gt;&lt;a href="http://commons.wikipedia.org/wiki/Image:SJPan.jpg"&gt;&lt;img alt="City of San Jose" height="103" src="http://upload.wikimedia.org/wikipedia/commons/thumb/3/3f/SJPan.jpg/300px-SJPan.jpg" style="border: medium none ; display: block;" width="300"&gt;&lt;/img&gt;&lt;/a&gt;&lt;span class="zemanta-img-attribution"&gt;Image via &lt;a href="http://commons.wikipedia.org/wiki/Image:SJPan.jpg"&gt;Wikipedia&lt;/a&gt;&lt;/span&gt;&lt;/p&gt;I have been on a bit of a blogging hiatus the last month.  No specific reason for this other than being very busy and travelling a lot.  During this time I have had a lot of interesting calls and I spent most of last week in Silicon Valley so there is much to write about.  Over the next few posts I will try and get back up to date.&lt;br&gt;&#xD;
&#xD;
&lt;div class="zemanta-pixie" style="margin-top: 10px; height: 15px;"&gt;&lt;a class="zemanta-pixie-a" href="http://reblog.zemanta.com/zemified/f6f35c87-0745-400b-ab89-3f28172db69c/" title="Reblog this post [with Zemanta]"&gt;&lt;img alt="Reblog this post [with Zemanta]" class="zemanta-pixie-img " src="http://img.zemanta.com/reblog_e.png?x-id=f6f35c87-0745-400b-ab89-3f28172db69c" style="border: medium none ; float: right;"&gt;&lt;/img&gt;&lt;/a&gt;&lt;span class="zem-script more-related pretty-attribution"&gt;&lt;script defer="defer" src="http://static.zemanta.com/readside/loader.js" type="text/javascript"&gt;&lt;/script&gt;&lt;/span&gt;&lt;/div&gt;&lt;/div&gt;&lt;div class="feedflare"&gt;
&lt;a href="http://feeds.feedburner.com/~ff/TonyBain?a=v5zAS9-kcD8:6nQAwTNy1KU:yIl2AUoC8zA"&gt;&lt;img src="http://feeds.feedburner.com/~ff/TonyBain?d=yIl2AUoC8zA" border="0"&gt;&lt;/img&gt;&lt;/a&gt; &lt;a href="http://feeds.feedburner.com/~ff/TonyBain?a=v5zAS9-kcD8:6nQAwTNy1KU:F7zBnMyn0Lo"&gt;&lt;img src="http://feeds.feedburner.com/~ff/TonyBain?i=v5zAS9-kcD8:6nQAwTNy1KU:F7zBnMyn0Lo" border="0"&gt;&lt;/img&gt;&lt;/a&gt; &lt;a href="http://feeds.feedburner.com/~ff/TonyBain?a=v5zAS9-kcD8:6nQAwTNy1KU:V_sGLiPBpWU"&gt;&lt;img src="http://feeds.feedburner.com/~ff/TonyBain?i=v5zAS9-kcD8:6nQAwTNy1KU:V_sGLiPBpWU" border="0"&gt;&lt;/img&gt;&lt;/a&gt;
&lt;/div&gt;&lt;img src="http://feeds.feedburner.com/~r/TonyBain/~4/v5zAS9-kcD8" height="1" width="1"/&gt;</content>


    </entry>
    <entry>
        <title>DBMS Links of the Week</title>
        <link rel="alternate" type="text/html" href="http://blog.tonybain.com/tony_bain/2009/09/dbms-links-of-the-week.html" />
        <link rel="replies" type="text/html" href="http://blog.tonybain.com/tony_bain/2009/09/dbms-links-of-the-week.html" thr:count="0" />
        <id>tag:typepad.com,2003:post-6a00d834559d1e69e20120a59b0a66970b</id>
        <published>2009-09-26T08:46:34+10:00</published>
        <updated>2009-09-26T08:46:34+10:00</updated>
        <summary>Image by plαdys via Flickr The following is a list of interesting DBMS related links for the week: Ellison's Impatience Over Sun Intel squeezes one million IOPS from desktop Is the RDBMS doomed (yada yada yada) ? EDS brand is...</summary>
        <author>
            <name>Tony Bain</name>
        </author>
        <category scheme="http://www.sixapart.com/ns/types#category" term="Business Intelligence" />
        <category scheme="http://www.sixapart.com/ns/types#category" term="Cloud Databases" />
        <category scheme="http://www.sixapart.com/ns/types#category" term="Database Management" />
        <category scheme="http://www.sixapart.com/ns/types#category" term="Microsoft SQL Server" />
        <category scheme="http://www.sixapart.com/ns/types#category" term="MySQL" />
        <category scheme="http://www.sixapart.com/ns/types#category" term="NoSQL" />
        <category scheme="http://www.sixapart.com/ns/types#category" term="Oracle" />
        <category scheme="http://www.sixapart.com/ns/types#category" term="Relational DB" />
        <category scheme="http://www.sixapart.com/ns/types#category" term="Web/Tech" />
        
        <category scheme="http://sixapart.com/ns/types#tag" term="Database" />
        <category scheme="http://sixapart.com/ns/types#tag" term="Database management system" />
        <category scheme="http://sixapart.com/ns/types#tag" term="Relational" />
        <category scheme="http://sixapart.com/ns/types#tag" term="Relational database" />
        
<content type="html" xml:lang="en-AU" xml:base="http://blog.tonybain.com/tony_bain/">&lt;div xmlns="http://www.w3.org/1999/xhtml"&gt;&lt;p class="zemanta-img" style="margin: 1em; float: right; display: block; width: 170px;"&gt;&lt;a href="http://www.flickr.com/photos/85169589@N00/2899452791"&gt;&lt;img alt="Larry Ellison" height="240" src="http://farm4.static.flickr.com/3282/2899452791_577f058dc7_m.jpg" style="border: medium none ; display: block;" width="160"&gt;&lt;/img&gt;&lt;/a&gt;&lt;span class="zemanta-img-attribution"&gt;Image by &lt;a href="http://www.flickr.com/photos/85169589@N00/2899452791"&gt;plαdys&lt;/a&gt; via Flickr&lt;/span&gt;&lt;/p&gt;&lt;p&gt;The following is a list of interesting DBMS related links for the week:&lt;/p&gt;&lt;ul&gt;&#xD;
&lt;li style="font-family: inherit;"&gt;&lt;a href="http://www.businessweek.com/the_thread/techbeat/archives/2009/09/toward_the_end.html" target="_blank"&gt;Ellison's Impatience Over Sun&lt;/a&gt;&lt;/li&gt;&#xD;
&lt;li style="font-family: inherit;"&gt;&lt;a href="http://www.theregister.co.uk/2009/09/23/insane_ssd_performance/" target="_blank"&gt;Intel squeezes one million IOPS from desktop&lt;/a&gt;&lt;/li&gt;&#xD;
&lt;li style="font-family: inherit;"&gt;&lt;a href="http://blog.tonybain.com/tony_bain/2009/09/the-rdbms-is-doomed-yada-yada-yada.html" target="_blank"&gt;Is the RDBMS doomed (yada yada yada) ?&lt;/a&gt;&lt;/li&gt;&#xD;
&lt;li style="font-family: inherit;"&gt;&lt;a href="http://www.itnews.com.au/News/156598,eds-brand-is-no-more.aspx" target="_blank"&gt;EDS brand is no more (not DBMS but interesting)&lt;/a&gt;&lt;/li&gt;&#xD;
&lt;/ul&gt;&#xD;
&lt;br&gt;&lt;br&gt;&lt;fieldset class="zemanta-related"&gt;&lt;legend class="zemanta-related-title"&gt;Related articles by Zemanta&lt;/legend&gt;&lt;ul class="zemanta-article-ul"&gt;&lt;li class="zemanta-article-ul-li"&gt;&lt;a href="http://ducknetweb.blogspot.com/2009/09/larry-ellison-on-oracle-wants-to-be-ibm.html"&gt;Larry Ellison on Oracle - Wants to be IBM, T.J. Watson's IBM&lt;/a&gt; (ducknetweb.blogspot.com)&lt;/li&gt;&#xD;
&lt;/ul&gt;&#xD;
&lt;/fieldset&gt;&#xD;
&#xD;
&lt;div class="zemanta-pixie" style="margin-top: 10px; height: 15px;"&gt;&lt;a class="zemanta-pixie-a" href="http://reblog.zemanta.com/zemified/e54eba23-601c-47b3-a4ee-9fc0f51d715d/" title="Reblog this post [with Zemanta]"&gt;&lt;img alt="Reblog this post [with Zemanta]" class="zemanta-pixie-img" src="http://img.zemanta.com/reblog_e.png?x-id=e54eba23-601c-47b3-a4ee-9fc0f51d715d" style="border: medium none ; float: right;"&gt;&lt;/img&gt;&lt;/a&gt;&lt;span class="zem-script more-related pretty-attribution"&gt;&lt;script defer="defer" src="http://static.zemanta.com/readside/loader.js" type="text/javascript"&gt;&lt;/script&gt;&lt;/span&gt;&lt;/div&gt;&lt;/div&gt;&lt;div class="feedflare"&gt;
&lt;a href="http://feeds.feedburner.com/~ff/TonyBain?a=9Sbrrb8v11I:LyBv7tb8UDg:yIl2AUoC8zA"&gt;&lt;img src="http://feeds.feedburner.com/~ff/TonyBain?d=yIl2AUoC8zA" border="0"&gt;&lt;/img&gt;&lt;/a&gt; &lt;a href="http://feeds.feedburner.com/~ff/TonyBain?a=9Sbrrb8v11I:LyBv7tb8UDg:F7zBnMyn0Lo"&gt;&lt;img src="http://feeds.feedburner.com/~ff/TonyBain?i=9Sbrrb8v11I:LyBv7tb8UDg:F7zBnMyn0Lo" border="0"&gt;&lt;/img&gt;&lt;/a&gt; &lt;a href="http://feeds.feedburner.com/~ff/TonyBain?a=9Sbrrb8v11I:LyBv7tb8UDg:V_sGLiPBpWU"&gt;&lt;img src="http://feeds.feedburner.com/~ff/TonyBain?i=9Sbrrb8v11I:LyBv7tb8UDg:V_sGLiPBpWU" border="0"&gt;&lt;/img&gt;&lt;/a&gt;
&lt;/div&gt;&lt;img src="http://feeds.feedburner.com/~r/TonyBain/~4/9Sbrrb8v11I" height="1" width="1"/&gt;</content>


    </entry>
    <entry>
        <title>Is the RDBMS doomed (yada yada yada) ?</title>
        <link rel="alternate" type="text/html" href="http://blog.tonybain.com/tony_bain/2009/09/the-rdbms-is-doomed-yada-yada-yada.html" />
        <link rel="replies" type="text/html" href="http://blog.tonybain.com/tony_bain/2009/09/the-rdbms-is-doomed-yada-yada-yada.html" thr:count="0" />
        <id>tag:typepad.com,2003:post-6a00d834559d1e69e20120a58a0ec2970b</id>
        <published>2009-09-22T09:03:00+10:00</published>
        <updated>2009-09-22T09:12:14+10:00</updated>
        <summary>Image by Snooch2TheNooch via Flickr I was speaking with Michael Stonebraker this morning. I mentioned that lately many have been referencing comments he has made over the last couple of years. And I also mentioned that many had interpreted them...</summary>
        <author>
            <name>Tony Bain</name>
        </author>
        <category scheme="http://www.sixapart.com/ns/types#category" term="Business Intelligence" />
        <category scheme="http://www.sixapart.com/ns/types#category" term="Cloud Databases" />
        <category scheme="http://www.sixapart.com/ns/types#category" term="Data Integration" />
        <category scheme="http://www.sixapart.com/ns/types#category" term="Database Management" />
        <category scheme="http://www.sixapart.com/ns/types#category" term="Microsoft SQL Server" />
        <category scheme="http://www.sixapart.com/ns/types#category" term="MySQL" />
        <category scheme="http://www.sixapart.com/ns/types#category" term="NoSQL" />
        <category scheme="http://www.sixapart.com/ns/types#category" term="Oracle" />
        <category scheme="http://www.sixapart.com/ns/types#category" term="Relational DB" />
        <category scheme="http://www.sixapart.com/ns/types#category" term="Startups" />
        <category scheme="http://www.sixapart.com/ns/types#category" term="Web 2.0" />
        
        <category scheme="http://sixapart.com/ns/types#tag" term="Database" />
        <category scheme="http://sixapart.com/ns/types#tag" term="Michael Stonebraker" />
        <category scheme="http://sixapart.com/ns/types#tag" term="MPP" />
        <category scheme="http://sixapart.com/ns/types#tag" term="Relational" />
        <category scheme="http://sixapart.com/ns/types#tag" term="Relational database" />
        <category scheme="http://sixapart.com/ns/types#tag" term="SQL" />
        <category scheme="http://sixapart.com/ns/types#tag" term="Transaction processing" />
        
<content type="html" xml:lang="en-AU" xml:base="http://blog.tonybain.com/tony_bain/">&lt;div xmlns="http://www.w3.org/1999/xhtml"&gt;&lt;p class="zemanta-img" style="margin: 1em; float: right; display: block; width: 190px;"&gt;&lt;a href="http://www.flickr.com/photos/36680989@N04/3459491112"&gt;&lt;img alt="Ladybower Plughole" src="http://farm4.static.flickr.com/3553/3459491112_562f29d3f0_m.jpg" style="border: medium none ; display: block;"&gt;&lt;/img&gt;&lt;/a&gt;&lt;span class="zemanta-img-attribution"&gt;Image by &lt;a href="http://www.flickr.com/photos/36680989@N04/3459491112"&gt;Snooch2TheNooch&lt;/a&gt; via Flickr&lt;/span&gt;&lt;/p&gt;&lt;p&gt;I was speaking with &lt;a href="http://en.wikipedia.org/wiki/Michael_Stonebraker" target="_blank"&gt;Michael Stonebraker&lt;/a&gt; this morning.  I mentioned that lately many have been &lt;a href="http://cacm.acm.org/blogs/blog-cacm/32212-the-end-of-a-dbms-era-might-be-upon-us/fulltext" target="_blank"&gt;referencing comments&lt;/a&gt; he has made over the last couple of years.  And I also mentioned that many had interpreted them as he was implying the RDBMS is “doomed”.  Mike has been saying the same thing for years, but the current NoSQL movement seems to have picked up on this and highlighting one of the RDBMS's own pioneers &lt;a href="http://www.infoq.com/news/2009/08/NoSQL-and-the-End-of-RDBMS-Era" target="_blank"&gt;is predicting its demise&lt;/a&gt;.&lt;/p&gt;&lt;p&gt;I asked Mike to clarify this.  My interpretation of his response is as follows.  I understand that he doesn’t believe the relational database itself is doomed.  Instead the current general purpose implementations, or “elephants” using his words, were out of date.  By moving away from a historical GP function into something more specific in focus, either in transaction processing or analytics, you can easily get 50x performance improvement over GP RDBMS.  This doesn’t necessarily mean moving away from the “relational” nature, but instead changing some core design principles for how a RDBMS is implemented.  It is this improvement factor that will see “new” specialist platforms overtake “old” general purpose platforms.  That is gradually, over time.  However Mike also mentioned the relational data model doesn’t make sense in a number of disciplines, particularly in sciences, and alternative modeling paradigms will offer benefits to this market (hence his focus on &lt;a href="http://scidb.org/" target="_blank"&gt;SciDB&lt;/a&gt;).  So while relational is a valid data model, other data models are also needed.&lt;/p&gt;&lt;p&gt;I have a similar position to Mike, but perhaps with a few differences.  &lt;/p&gt;&lt;p&gt;- Firstly I agree with the mantra that current GP RDBMS platforms provide only a “middle of the road” capability, and we gone too far in using a GP RDBMS for everything.  However I do believe there is a long term future for the GP RDBMS.  A general purpose application requirement will continued to be well suited for a general purpose platform.  With a specialist only approach, a general purpose requirement may need both a specialist OLTP platform and a specialist Analytics platform to provide the same capability.&lt;/p&gt;&lt;p&gt;- I agree that with an extreme requirement, either analytics or transaction processing, a specialist platform is well suited.  But I don’t see the choices of just MPP or memory resident RBDMS as being a broad enough set.  Apps that use a db just as a persistence cache will benefit from a high performing, scalable database platform with much tighter integration with the object model.  I am not sure any of the current NoSQL platforms have it quite right yet, but when these guys eventually get together with the database guys and work on these things together they may get there.&lt;/p&gt;&lt;p&gt;- I don’t think a 50x performance speed up on its own is enough to drive change in OLTP.  I have &lt;a href="http://blog.tonybain.com/tony_bain/2009/07/positioning-your-database-start-up-for-enterprise-oltp.html" target="_blank"&gt;written before&lt;/a&gt; how difficult it is to get into this market and how tight Oracle, Microsoft &amp;amp; IBM have this sewn up.  But I don’t believe it is impossible, I think you just need to bring slam dunks on multiple fronts (performance just being one of them).&lt;/p&gt;&lt;p&gt;Anyway I feel like I am a bit of a broken record at the moment.  I have been addressing the “is the RDBMS doomed” question a couple of times a day for some time. Time to focus on something else for a bit.&lt;/p&gt;&lt;br&gt;&#xD;
&#xD;
&lt;div class="zemanta-pixie" style="margin-top: 10px; height: 15px;"&gt;&lt;a class="zemanta-pixie-a" href="http://reblog.zemanta.com/zemified/3240b67b-7d7a-48c8-9fe1-18ff45e8906c/" title="Reblog this post [with Zemanta]"&gt;&lt;img alt="Reblog this post [with Zemanta]" class="zemanta-pixie-img " src="http://img.zemanta.com/reblog_e.png?x-id=3240b67b-7d7a-48c8-9fe1-18ff45e8906c" style="border: medium none ; float: right;"&gt;&lt;/img&gt;&lt;/a&gt;&lt;span class="zem-script more-related pretty-attribution"&gt;&lt;script src="http://static.zemanta.com/readside/loader.js" type="text/javascript"&gt;&lt;/script&gt;&lt;/span&gt;&lt;/div&gt;&lt;/div&gt;&lt;div class="feedflare"&gt;
&lt;a href="http://feeds.feedburner.com/~ff/TonyBain?a=dBUjBZeeTtk:hdnQZ9vXCiQ:yIl2AUoC8zA"&gt;&lt;img src="http://feeds.feedburner.com/~ff/TonyBain?d=yIl2AUoC8zA" border="0"&gt;&lt;/img&gt;&lt;/a&gt; &lt;a href="http://feeds.feedburner.com/~ff/TonyBain?a=dBUjBZeeTtk:hdnQZ9vXCiQ:F7zBnMyn0Lo"&gt;&lt;img src="http://feeds.feedburner.com/~ff/TonyBain?i=dBUjBZeeTtk:hdnQZ9vXCiQ:F7zBnMyn0Lo" border="0"&gt;&lt;/img&gt;&lt;/a&gt; &lt;a href="http://feeds.feedburner.com/~ff/TonyBain?a=dBUjBZeeTtk:hdnQZ9vXCiQ:V_sGLiPBpWU"&gt;&lt;img src="http://feeds.feedburner.com/~ff/TonyBain?i=dBUjBZeeTtk:hdnQZ9vXCiQ:V_sGLiPBpWU" border="0"&gt;&lt;/img&gt;&lt;/a&gt;
&lt;/div&gt;&lt;img src="http://feeds.feedburner.com/~r/TonyBain/~4/dBUjBZeeTtk" height="1" width="1"/&gt;</content>


    </entry>
    <entry>
        <title>Some Initial Thoughts on Oracle Exadata V2</title>
        <link rel="alternate" type="text/html" href="http://blog.tonybain.com/tony_bain/2009/09/some-initial-thoughts-on-oracle-exadata-v2.html" />
        <link rel="replies" type="text/html" href="http://blog.tonybain.com/tony_bain/2009/09/some-initial-thoughts-on-oracle-exadata-v2.html" thr:count="0" />
        <id>tag:typepad.com,2003:post-6a00d834559d1e69e20120a5c8e673970c</id>
        <published>2009-09-16T08:48:10+10:00</published>
        <updated>2009-09-16T09:04:29+10:00</updated>
        <summary>Image via Wikipedia There will be plenty of detailed coverage on Exadata V2 so I won’t attempt to replicate that. However I do have a couple of initial thoughts which I would like to share. For those who missed it,...</summary>
        <author>
            <name>Tony Bain</name>
        </author>
        <category scheme="http://www.sixapart.com/ns/types#category" term="Business Intelligence" />
        <category scheme="http://www.sixapart.com/ns/types#category" term="Cloud Databases" />
        <category scheme="http://www.sixapart.com/ns/types#category" term="Database Management" />
        <category scheme="http://www.sixapart.com/ns/types#category" term="Microsoft SQL Server" />
        <category scheme="http://www.sixapart.com/ns/types#category" term="MySQL" />
        <category scheme="http://www.sixapart.com/ns/types#category" term="Oracle" />
        <category scheme="http://www.sixapart.com/ns/types#category" term="Relational DB" />
        <category scheme="http://www.sixapart.com/ns/types#category" term="Web 2.0" />
        
        <category scheme="http://sixapart.com/ns/types#tag" term="Database" />
        <category scheme="http://sixapart.com/ns/types#tag" term="Flash memory" />
        <category scheme="http://sixapart.com/ns/types#tag" term="FlashFire" />
        <category scheme="http://sixapart.com/ns/types#tag" term="Microsoft" />
        <category scheme="http://sixapart.com/ns/types#tag" term="Oracle" />
        <category scheme="http://sixapart.com/ns/types#tag" term="Oracle Database" />
        <category scheme="http://sixapart.com/ns/types#tag" term="Sun" />
        
<content type="html" xml:lang="en-AU" xml:base="http://blog.tonybain.com/tony_bain/">&lt;div xmlns="http://www.w3.org/1999/xhtml"&gt;&lt;p class="zemanta-img" style="margin: 1em; float: right; display: block; width: 310px;"&gt;&lt;a href="http://en.wikipedia.org/wiki/Image:Oracle_logo.svg"&gt;&lt;img alt="Oracle Corporation" height="43" src="http://upload.wikimedia.org/wikipedia/en/thumb/5/50/Oracle_logo.svg/300px-Oracle_logo.svg.png" style="border: medium none ; display: block;" width="300"&gt;&lt;/img&gt;&lt;/a&gt;&lt;span class="zemanta-img-attribution"&gt;Image via &lt;a href="http://en.wikipedia.org/wiki/Image:Oracle_logo.svg"&gt;Wikipedia&lt;/a&gt;&lt;/span&gt;&lt;/p&gt;&lt;p&gt;There will be plenty of detailed coverage on &lt;a href="http://www.oracle.com/us/corporate/press/033684" target="_blank"&gt;Exadata V2&lt;/a&gt; so I won’t attempt to replicate that.  However I do have a couple of initial thoughts which I would like to share.  For those who missed it, Oracle has just announced Exadata V2 (which is their pre-built “machine”).  Exadata V1 was built using HP equipment, Exadata V2 is using Sun.  The main addition to Exadata V2 seems to be an extra tier in the memory hierarchy, a flash cache.  Oracle is very quick to point out this is not flash disk, but it is flash memory, Sun’s FlashFire technology (flash disk or SSD’s was always going to be a transition technology, flash memory doesn’t have the physical constraints of moving parts disk so the whole “disk” concept for flash doesn’t make too much sense other than it fits easily with current architectures).&lt;/p&gt;&lt;p&gt;The new memory layer (Processor Cache’s -&amp;gt; DRAM -&amp;gt; Flash Cache -&amp;gt; Disk) coupled with Oracle’s algorithms to effectively use the Flash Cache layer brings performance benefit to the solution (+ all the other improvements 12 months of hardware innovation brings, faster CPU’s, more memory etc).&lt;/p&gt;&lt;p&gt;My initial thoughts are:&lt;/p&gt;&lt;ul&gt;&#xD;
&lt;li&gt;Kudos to Oracle.  They are the first vendor to really bring a bunch of this leading edge technology together in a semi-mainstream way.  Flash Cache, Inifiband interconnects, DBMS optimizations using flash hasn't really surfaced anywhere outside of startups yet.&lt;/li&gt;&#xD;
&lt;li&gt;So what happens to Exadata V1 customers using the HP solution?  This is only about a year old.  Some analysts are suggesting there has only been minor sales of Exadata V1 (I am not an analyst so don’t really know).  So why would HP continue to support a platform where no new sales will be created, when potentially only a limited number of customers have it today?  Possibly Oracle will offer attractive terms to move existing HP Exadata V1 customers to Sun Exadata V2.&lt;/li&gt;&#xD;
&lt;li&gt;It is a preconfigured solution that you by in certain size configurations.  Small, half rack, full rack, multiple racks.  I think Larry said that 3 racks will give you a PetaByte of storage capacity.  This is fine, except they are targeting it for use with OLTP and data warehousing workloads.  It seems odd that to get very high computational resources for transaction processing, you would also get massive volumes of potentially unnecessary storage capacity.  It will be interesting to see if they allow the balance between processing &amp;amp; storage to be modified as part of configuration.&lt;/li&gt;&#xD;
&lt;/ul&gt;&#xD;
&lt;p&gt;&lt;br&gt;I have had some questions along the lines of “isn’t this back to the one size fits all approach?”  Well yes it is, but Oracle never really moved away from this in terms of the core DBMS.  It is my understanding that Oracle Exadata was still the general purpose Oracle DBMS &amp;amp; RAC but on a hardware platform optimized for accessing large data sets (making it a data warehousing solution).  Using FlashFire, the hardware can now do high levels of random I/O (I think 1m random I/O’s was quoted) which makes the hardware platform general purpose as well.&lt;/p&gt;&lt;p&gt;One interesting question will be if, under Oracle, other vendors can buy the exact same hardware configuration from Sun and optimize their DBMS for Flash also?   If so, it may be difficult for them to do this in a way that is price competitive.  And will competitive DBMS vendors really want to help fill Oracle’s pockets further?&lt;/p&gt;&lt;p&gt;If we expect to see more of this hardware alignment between DBMS vendors where does that leave Microsoft?  Maybe HP is already peeling the Exadata V1 logos off their racks and sticking Microsoft Madison logo’s in their place?&lt;/p&gt;&lt;p&gt;&lt;em&gt;UPDATE:&lt;/em&gt;&lt;/p&gt;&lt;p&gt;Oracle has put out a &lt;a href="http://www.oracle.com/technology/products/bi/db/exadata/exadata-faq.html" target="_blank"&gt;FAQ &lt;/a&gt;which partly answers some of the questions.&lt;/p&gt;&lt;br&gt;&#xD;
&#xD;
&lt;div class="zemanta-pixie" style="margin-top: 10px; height: 15px;"&gt;&lt;a class="zemanta-pixie-a" href="http://reblog.zemanta.com/zemified/05f16aef-3e9d-4ed4-a95d-9bb25ccf1f25/" title="Reblog this post [with Zemanta]"&gt;&lt;img alt="Reblog this post [with Zemanta]" class="zemanta-pixie-img " src="http://img.zemanta.com/reblog_e.png?x-id=05f16aef-3e9d-4ed4-a95d-9bb25ccf1f25" style="border: medium none ; float: right;"&gt;&lt;/img&gt;&lt;/a&gt;&lt;span class="zem-script more-related pretty-attribution"&gt;&lt;script src="http://static.zemanta.com/readside/loader.js" type="text/javascript"&gt;&lt;/script&gt;&lt;/span&gt;&lt;/div&gt;&lt;/div&gt;&lt;div class="feedflare"&gt;
&lt;a href="http://feeds.feedburner.com/~ff/TonyBain?a=obt9fO74Eak:p9hcWfl7QZc:yIl2AUoC8zA"&gt;&lt;img src="http://feeds.feedburner.com/~ff/TonyBain?d=yIl2AUoC8zA" border="0"&gt;&lt;/img&gt;&lt;/a&gt; &lt;a href="http://feeds.feedburner.com/~ff/TonyBain?a=obt9fO74Eak:p9hcWfl7QZc:F7zBnMyn0Lo"&gt;&lt;img src="http://feeds.feedburner.com/~ff/TonyBain?i=obt9fO74Eak:p9hcWfl7QZc:F7zBnMyn0Lo" border="0"&gt;&lt;/img&gt;&lt;/a&gt; &lt;a href="http://feeds.feedburner.com/~ff/TonyBain?a=obt9fO74Eak:p9hcWfl7QZc:V_sGLiPBpWU"&gt;&lt;img src="http://feeds.feedburner.com/~ff/TonyBain?i=obt9fO74Eak:p9hcWfl7QZc:V_sGLiPBpWU" border="0"&gt;&lt;/img&gt;&lt;/a&gt;
&lt;/div&gt;&lt;img src="http://feeds.feedburner.com/~r/TonyBain/~4/obt9fO74Eak" height="1" width="1"/&gt;</content>


    </entry>
    <entry>
        <title>OLTP back into focus</title>
        <link rel="alternate" type="text/html" href="http://blog.tonybain.com/tony_bain/2009/09/oltp-back-into-focus.html" />
        <link rel="replies" type="text/html" href="http://blog.tonybain.com/tony_bain/2009/09/oltp-back-into-focus.html" thr:count="0" />
        <id>tag:typepad.com,2003:post-6a00d834559d1e69e20120a5c1469c970c</id>
        <published>2009-09-14T09:55:25+10:00</published>
        <updated>2009-09-14T09:55:25+10:00</updated>
        <summary>I haven’t blogged in over a month now. This is for a number of reasons. Firstly I have been flat out with various activities. This included a trip to VLDB in Lyon mid month. Secondly, a lot of the companies...</summary>
        <author>
            <name>Tony Bain</name>
        </author>
        <category scheme="http://www.sixapart.com/ns/types#category" term="Business Intelligence" />
        <category scheme="http://www.sixapart.com/ns/types#category" term="Cloud Databases" />
        <category scheme="http://www.sixapart.com/ns/types#category" term="Database Management" />
        <category scheme="http://www.sixapart.com/ns/types#category" term="MySQL" />
        <category scheme="http://www.sixapart.com/ns/types#category" term="Oracle" />
        <category scheme="http://www.sixapart.com/ns/types#category" term="Relational DB" />
        <category scheme="http://www.sixapart.com/ns/types#category" term="Startups" />
        <category scheme="http://www.sixapart.com/ns/types#category" term="Web/Tech" />
        
        <category scheme="http://sixapart.com/ns/types#tag" term="Database" />
        <category scheme="http://sixapart.com/ns/types#tag" term="OLTP" />
        <category scheme="http://sixapart.com/ns/types#tag" term="RDBMS" />
        <category scheme="http://sixapart.com/ns/types#tag" term="transaction processing" />
        
<content type="html" xml:lang="en-AU" xml:base="http://blog.tonybain.com/tony_bain/">&lt;div xmlns="http://www.w3.org/1999/xhtml"&gt;&lt;p&gt;I haven’t blogged in over a month now.  This is for a number of reasons.  Firstly I have been flat out with various activities.  This included a trip to VLDB in Lyon mid month.  Secondly, a lot of the companies I have spoken with this month aren’t ready to speak publically so hence no blog posts resulting from these sorts of discussions.&lt;/p&gt;&lt;p&gt;&lt;img src="http://vldb2009.org/photos/Tuesday/images/tuesday25august_049.jpg"&gt;&lt;/img&gt;&lt;/p&gt;&lt;p&gt;However there has been a wiff of a change in the air in terms of focus that is interesting and worth highlighting.  After years of lots of innovation around data analytics, OLTP is starting to make a comeback in terms of reclaiming some of the limelight.  Much more on this between now and the end of the year, but a couple things to watch:&lt;/p&gt;&lt;ul&gt;&#xD;
&lt;li style="font-family: inherit;"&gt;&lt;a href="http://www.boston.com/business/technology/innoeco/2009/08/on_the_radar_voltdb_just_the_l.html" target="_blank"&gt;On the Radar: VoltDB&lt;/a&gt;&lt;/li&gt;&#xD;
&lt;li style="font-family: inherit;"&gt;&lt;a href="http://www.sun.com/featured-articles/2009-0911/feature/index.jsp" target="_blank"&gt;Oracle announces OLTP database machine with Sun's FlashFire technology&lt;/a&gt;&lt;/li&gt;&#xD;
&lt;/ul&gt;&lt;/div&gt;&lt;div class="feedflare"&gt;
&lt;a href="http://feeds.feedburner.com/~ff/TonyBain?a=6iRmN-wobuk:am7eTmJflqk:yIl2AUoC8zA"&gt;&lt;img src="http://feeds.feedburner.com/~ff/TonyBain?d=yIl2AUoC8zA" border="0"&gt;&lt;/img&gt;&lt;/a&gt; &lt;a href="http://feeds.feedburner.com/~ff/TonyBain?a=6iRmN-wobuk:am7eTmJflqk:F7zBnMyn0Lo"&gt;&lt;img src="http://feeds.feedburner.com/~ff/TonyBain?i=6iRmN-wobuk:am7eTmJflqk:F7zBnMyn0Lo" border="0"&gt;&lt;/img&gt;&lt;/a&gt; &lt;a href="http://feeds.feedburner.com/~ff/TonyBain?a=6iRmN-wobuk:am7eTmJflqk:V_sGLiPBpWU"&gt;&lt;img src="http://feeds.feedburner.com/~ff/TonyBain?i=6iRmN-wobuk:am7eTmJflqk:V_sGLiPBpWU" border="0"&gt;&lt;/img&gt;&lt;/a&gt;
&lt;/div&gt;&lt;img src="http://feeds.feedburner.com/~r/TonyBain/~4/6iRmN-wobuk" height="1" width="1"/&gt;</content>


    </entry>
    <entry>
        <title>VectorWise</title>
        <link rel="alternate" type="text/html" href="http://blog.tonybain.com/tony_bain/2009/08/vectorwise.html" />
        <link rel="replies" type="text/html" href="http://blog.tonybain.com/tony_bain/2009/08/vectorwise.html" thr:count="0" />
        <id>tag:typepad.com,2003:post-6a00d834559d1e69e20115715a89ad970c</id>
        <published>2009-08-01T10:33:57+10:00</published>
        <updated>2009-08-01T18:50:47+10:00</updated>
        <summary>I was fortunate enough to speak with Marcin Zukowski earlier about VectorWise. If you missed it, VectorWise came out of stealth mode a day or two ago. The have announced a joint partnership with Ingres and essentially are claiming impressive...</summary>
        <author>
            <name>Tony Bain</name>
        </author>
        <category scheme="http://www.sixapart.com/ns/types#category" term="Business Intelligence" />
        <category scheme="http://www.sixapart.com/ns/types#category" term="Cloud Databases" />
        <category scheme="http://www.sixapart.com/ns/types#category" term="Data Integration" />
        <category scheme="http://www.sixapart.com/ns/types#category" term="Database Management" />
        <category scheme="http://www.sixapart.com/ns/types#category" term="Microsoft SQL Server" />
        <category scheme="http://www.sixapart.com/ns/types#category" term="MySQL" />
        <category scheme="http://www.sixapart.com/ns/types#category" term="Oracle" />
        <category scheme="http://www.sixapart.com/ns/types#category" term="Relational DB" />
        <category scheme="http://www.sixapart.com/ns/types#category" term="Startups" />
        <category scheme="http://www.sixapart.com/ns/types#category" term="Web 2.0" />
        <category scheme="http://www.sixapart.com/ns/types#category" term="Web/Tech" />
        
        <category scheme="http://sixapart.com/ns/types#tag" term="Ingres" />
        <category scheme="http://sixapart.com/ns/types#tag" term="MonetDB" />
        <category scheme="http://sixapart.com/ns/types#tag" term="Open source" />
        <category scheme="http://sixapart.com/ns/types#tag" term="RDBMS" />
        <category scheme="http://sixapart.com/ns/types#tag" term="Relational database" />
        <category scheme="http://sixapart.com/ns/types#tag" term="VectorWise" />
        
<content type="html" xml:lang="en-AU" xml:base="http://blog.tonybain.com/tony_bain/">&lt;div xmlns="http://www.w3.org/1999/xhtml"&gt;&lt;p&gt;&lt;img src="http://www.vectorwise.com/images/logo_vectorwise.png"&gt;&lt;/img&gt;&#xD;
&lt;br&gt;I was fortunate enough to speak with &lt;a href="http://homepages.cwi.nl/%7Emarcin/" target="_blank"&gt;Marcin Zukowski&lt;/a&gt; earlier about &lt;a href="http://www.vectorwise.com" target="_blank"&gt;VectorWise&lt;/a&gt;.  If you missed it, VectorWise came out of stealth mode a day or two ago.  The have announced a joint &lt;a href="http://www.ingres.com/vectorwise/index.php" target="_blank"&gt;partnership with Ingres&lt;/a&gt; and essentially are claiming impressive analytic RDBMS performance gains on conventional hardware.&lt;/p&gt;&lt;p&gt;To start with, a key message that I think needs to be communicated here is that this is not a product announcement.  Ingres and VectorWise have announced a partnership in which they of course plan to build products together, today those products are still in the works.&lt;/p&gt;&lt;p&gt;VectorWise is a spin out of &lt;a href="http://www.cwi.nl/" target="_blank"&gt;CWI &lt;/a&gt;based on research that was undertaken by Marcin and others, research that centered on &lt;a href="http://monetdb.cwi.nl/" target="_blank"&gt;MonetDB&lt;/a&gt;.  Explaining the essence of VectorWise is difficult because it is largely internal DBMS data storage &amp;amp; processing logic, but I will have a go.&lt;/p&gt;&lt;p&gt;The modern RDBMS is based around design principles that stem from general purpose OLTP roots and historical hardware architectures (this is partially true even for some of the newest analytic platforms).  These design principles in a nutshell focus on the fact that disk is slow &amp;amp; CPU is fast.  Data is seeked or partially scanned off disk and cached.  Row-by-row (tuple-by-tuple) operators process that data, passing the outcome of each operator to the next as part of a queries execution plan until ultimately producing the result.  &lt;/p&gt;&lt;p&gt;Traditionally I/O is the main bottleneck, so to make the database faster you add more I/O bandwidth.   Today, disk requirements may be up to 100x the actual capacity needs, so many disks are necessary to achieve the I/O bandwidth to provide performance for an analytical RDBMS implementation.  Even though the RBDMS’s may parallelize query operators across cores, this typically works by partitioning data between cores, yet each is still processing on a tuple-by-tuple basis.&lt;/p&gt;&lt;p&gt;Conventional wisdom?  Well maybe.  You see disk is only really “slow” when it is doing random seeks.  Give a disk something sequential to do on the other hand and things are very different.  Modern disks are able to sequentially scan in the range of 150MB per second.  An array of 10 disks should therefore be able to return sequentially read data in the range of 1GB per second.  &lt;/p&gt;&lt;p&gt;When it comes to databases, column based storage has been found to effectively structure data for a) high levels of compression and b) sequential access.  VectorWise makes use of both of these technologies to help it achieve high levels of sequential I/O.  The problem now however is that disk may no longer the bottleneck.  While we can get 1GB a second sequentially off disk relatively easily &amp;amp; cheaply, processing tuple-by-tuple at this rate is very difficult.  As it turns out, a RDBMS’s may only achieve a data processing rate of 50MB a second per CPU core.  This makes the CPU processing limitations a big bottleneck for analytics data sets, assuming the above figures we would need over 20 cores to keep up with 10 disks (and of course CPU cores don’t scalability linearly).&lt;/p&gt;&lt;p&gt;If we step out of the database world for the moment into the world of high end computer games, or high end scientific processing, we find their use of current CPU technology is much more advanced than what we are used to.  They are using new CPU extensions (MMX, SSE, SS2, &lt;a href="http://en.wikipedia.org/wiki/SSE4#SSE4.2"&gt;SSE4.2&lt;/a&gt; etc) to parallize &amp;amp; pipeline computation within a CPU’s core meaning they are processing orders of magnitude more instructions per core that what a traditional RDBMS typically has been able to. The exact details are too low level to discuss here (&lt;a href="http://www.vectorwise.com/index_js.php?page=company_origins" target="_blank"&gt;many of the research papers are available online&lt;/a&gt;) but it is fair to say, modern CPU architectures contain advanced features that to date haven’t effectively been exploited by database vendors.&lt;/p&gt;&lt;p&gt;Enter VectorWise.  Their aim is to marry storage technologies which allow high levels of sequential I/O to occur with query processing logic which is designed for modern CPU architectures.  Rather than process tuple-by-tuple they are processing “vectors”, groups of tuples, leveraging modern CPU extensions and high levels of on-chip cache to allow the CPU to carry out higher data processing throughput.  The result is instead of the 50MB a second in a tuple-by-tuple approach, VectorWise are able to achieve processing rates in the range of 500Mb-1GB a second per core in some situations.  This means processing rates of 8GB a second or more could be possible with relatively low end hardware.&lt;/p&gt;&lt;p&gt;“In some situations” is the key point to stress here, this obviously isn’t a blanket gain that applies to all analytic data sets, workloads and query requirements.  Just what those situations are will be the key to their technologies success, how well it actually applies to real world data sets and queries.  I wouldn’t expect to see too many specific examples on this until a product beta appears.  But the theory is VectorWise can offer high levels of processing capabilities with existing mainstream hardware.  At this point VectorWise isn’t even focusing on MPP instead they are single node focused.  If their scalability claims pan out you can imagine how this could allow a single node solution to be competitive with existing low to mid scale MPP solutions that are based on a more conventional query processing architecture.&lt;/p&gt;&lt;p&gt;This isn’t VectorWise’s only trick up their sleeve.  They are also are leveraging research around column based storage, compression, piggy-backed (shared) scans and so on.  Much of the research that has been adopted by VectorWise is referenced from their web site.&lt;/p&gt;&#xD;
&lt;p&gt;&lt;img alt="" src="http://www.ingres.com/images/ingres-vectorwise-logo.jpg"&gt;&lt;/img&gt;&#xD;
&lt;/p&gt;&lt;p&gt;So VectorWise have impressive technology, so why then partner with Ingres rather than a larger vendor (or going at it alone)?  Marcin offers a few reasons.  Firstly, as academics they feel strongly that open source is cool so this path was greatly preferred over a relationship with a non-open vendor.  Secondly Ingres will allow them to deliver their technology in an uncompromised fashion.  Marcin mentioned that if they had partnered with one of the big three vendors, that vendors existing product strategies and investments would have likely meant their ideas could have only been implemented in partial form.  Ingres on the other hand is going to allow them more of a green field.  And of course, a partnership with Ingres makes sense from a go to market perspective as Ingres already has a worldwide reputation, a global customer base, sales &amp;amp; marketing capabilities etc.&lt;/p&gt;&lt;p&gt;Marcin confirmed that Ingres have an exclusive license to their technology, and first option to acquire them for a certain period of time.  This allows Ingres to really invest in the relationship without the fear of the carpet being pulled out from under them.  &lt;/p&gt;&lt;p&gt;VectorWise clearly are applying innovative research to analytical RBDMS requirements.  But as interesting as the technology sounds, the proof in the pudding will be how well these design principals translate to real-world analytical processing requirements in mainstream product form.  This remains to be seen, but Ingres and their community clearly has high hopes.&lt;/p&gt;&lt;p&gt;VectorWise is clearly differentiated when comparison with a traditional mainstream RDBMS running on mainstream hardware.  However in this current market we have lots of different approaches to the problems described.  &lt;a href="http://www.kickfire.com/" target="_blank"&gt;Kickfire &lt;/a&gt;for example use their own SQL Chip processor to increase data processing rates and other appliance vendors are using FPGAs etc for similar purposes.  The comparison of these different approaches and the relative effectiveness of each approach still need to be examined, however a mainstream hardware approach has obvious benefits.&lt;/p&gt;&lt;br&gt;&lt;fieldset class="zemanta-related"&gt;&lt;legend class="zemanta-related-title"&gt;Related articles by Zemanta&lt;/legend&gt;&lt;ul class="zemanta-article-ul"&gt;&lt;li class="zemanta-article-ul-li"&gt;&lt;a href="http://www.theregister.co.uk/2009/07/29/ingres_vectorwise_datawarehouse/"&gt;Ingres challenges Microsoft's DataAllegro warehouse steal&lt;/a&gt; (theregister.co.uk)&lt;/li&gt;&#xD;
&lt;li class="zemanta-article-ul-li"&gt;&lt;a href="http://dbmsmusings.blogspot.com/2009/07/watch-out-for-vectorwise.html"&gt;Watch out for VectorWise&lt;/a&gt; (dbmsmusings.blogspot.com)&lt;/li&gt;&#xD;
&lt;/ul&gt;&#xD;
&lt;/fieldset&gt;&#xD;
&#xD;
&lt;div class="zemanta-pixie" style="margin-top: 10px; height: 15px;"&gt;&lt;a class="zemanta-pixie-a" href="http://reblog.zemanta.com/zemified/236fc16a-49f7-4b6e-9bb9-0ca78c331e2d/" title="Reblog this post [with Zemanta]"&gt;&lt;img alt="Reblog this post [with Zemanta]" class="zemanta-pixie-img " src="http://img.zemanta.com/reblog_e.png?x-id=236fc16a-49f7-4b6e-9bb9-0ca78c331e2d" style="border: medium none ; float: right;"&gt;&lt;/img&gt;&lt;/a&gt;&lt;span class="zem-script more-related pretty-attribution"&gt;&lt;script src="http://static.zemanta.com/readside/loader.js" type="text/javascript"&gt;&lt;/script&gt;&lt;/span&gt;&lt;/div&gt;&lt;/div&gt;&lt;div class="feedflare"&gt;
&lt;a href="http://feeds.feedburner.com/~ff/TonyBain?a=Ull68bVQx9U:-EmImyCLjI0:yIl2AUoC8zA"&gt;&lt;img src="http://feeds.feedburner.com/~ff/TonyBain?d=yIl2AUoC8zA" border="0"&gt;&lt;/img&gt;&lt;/a&gt; &lt;a href="http://feeds.feedburner.com/~ff/TonyBain?a=Ull68bVQx9U:-EmImyCLjI0:F7zBnMyn0Lo"&gt;&lt;img src="http://feeds.feedburner.com/~ff/TonyBain?i=Ull68bVQx9U:-EmImyCLjI0:F7zBnMyn0Lo" border="0"&gt;&lt;/img&gt;&lt;/a&gt; &lt;a href="http://feeds.feedburner.com/~ff/TonyBain?a=Ull68bVQx9U:-EmImyCLjI0:V_sGLiPBpWU"&gt;&lt;img src="http://feeds.feedburner.com/~ff/TonyBain?i=Ull68bVQx9U:-EmImyCLjI0:V_sGLiPBpWU" border="0"&gt;&lt;/img&gt;&lt;/a&gt;
&lt;/div&gt;&lt;img src="http://feeds.feedburner.com/~r/TonyBain/~4/Ull68bVQx9U" height="1" width="1"/&gt;</content>


    </entry>
 
</feed><!-- ph=1 --><!-- nhm:from_kauri -->
