<?xml version="1.0" encoding="UTF-8" ?>
<!--RDF based XML document generated By OpenLink Virtuoso-->
<rdf:RDF xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#">
 <rss:channel xmlns:rss="http://purl.org/rss/1.0/" rdf:about="http://www.openlinksw.com/weblog/dav/dav-blog-1/">
  <rss:title>OpenLink Community Blog</rss:title>
  <rss:link>http://www.openlinksw.com/weblog/dav/dav-blog-1/</rss:link>
  <rss:description>A Collection of blogs by OpenLink Staff</rss:description>
  <dc:creator xmlns:dc="http://purl.org/dc/elements/1.1/">kidehen@openlinksw.com</dc:creator>
  <dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2009-11-23T13:57:22Z</dc:date>
  <rss:items>
   <rdf:Seq>
      <rdf:li rdf:resource="http://www.openlinksw.com/blog/vdb/blog/?date=2009-05-28#1558" />
      <rdf:li rdf:resource="http://www.openlinksw.com/weblog/oerling/?date=2009-05-28#1557" />
      <rdf:li rdf:resource="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2009-03-30#1539" />
      <rdf:li rdf:resource="http://www.openlinksw.com/blog/vdb/blog/?date=2008-12-17#1503" />
      <rdf:li rdf:resource="http://www.openlinksw.com/weblog/oerling/?date=2008-12-17#1502" />
      <rdf:li rdf:resource="http://www.openlinksw.com/blog/vdb/blog/?date=2008-11-20#1485" />
      <rdf:li rdf:resource="http://www.openlinksw.com/weblog/oerling/?date=2008-11-20#1484" />
      <rdf:li rdf:resource="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2008-10-31#1468" />
      <rdf:li rdf:resource="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2008-10-24#1461" />
      <rdf:li rdf:resource="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2008-09-05#1430" />
      <rdf:li rdf:resource="http://www.openlinksw.com/blog/vdb/blog/?date=2008-08-06#1410" />
      <rdf:li rdf:resource="http://www.openlinksw.com/weblog/oerling/?date=2008-08-06#1409" />
      <rdf:li rdf:resource="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2008-08-03#1408" />
      <rdf:li rdf:resource="http://www.openlinksw.com/blog/vdb/blog/?date=2008-07-30#1401" />
      <rdf:li rdf:resource="http://www.openlinksw.com/weblog/oerling/?date=2008-07-30#1400" />
      <rdf:li rdf:resource="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2007-09-22#1261" />
      <rdf:li rdf:resource="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2007-04-01#1175" />
      <rdf:li rdf:resource="http://www.openlinksw.com/weblog/oerling/?date=2007-01-10#1116" />
      <rdf:li rdf:resource="http://www.openlinksw.com/blog/vdb/blog/?date=2007-01-10#1117" />
      <rdf:li rdf:resource="http://www.openlinksw.com/blog/vdb/blog/?date=2007-01-09#1110" />
      <rdf:li rdf:resource="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2006-09-26#1051" />
      <rdf:li rdf:resource="http://www.openlinksw.com/weblog/oerling/?date=2006-09-25#1112" />
      <rdf:li rdf:resource="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2006-05-31#987" />
      <rdf:li rdf:resource="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2006-05-05#968" />
      <rdf:li rdf:resource="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2006-04-28#965" />
      <rdf:li rdf:resource="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2006-04-28#993" />
      <rdf:li rdf:resource="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2006-04-11#951" />
      <rdf:li rdf:resource="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2006-03-14#939" />
      <rdf:li rdf:resource="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2006-02-22#936" />
      <rdf:li rdf:resource="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2006-01-18#924" />
      <rdf:li rdf:resource="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2006-01-11#922" />
      <rdf:li rdf:resource="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2005-11-16#904" />
      <rdf:li rdf:resource="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2005-10-26#882" />
      <rdf:li rdf:resource="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2005-04-26#810" />
      <rdf:li rdf:resource="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2005-04-21#793" />
      <rdf:li rdf:resource="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2005-03-26#766" />
      <rdf:li rdf:resource="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2005-02-23#691" />
      <rdf:li rdf:resource="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2004-11-19#642" />
      <rdf:li rdf:resource="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2004-06-17#562" />
      <rdf:li rdf:resource="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2004-05-27#552" />
      <rdf:li rdf:resource="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2004-05-14#543" />
      <rdf:li rdf:resource="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2004-04-30#535" />
      <rdf:li rdf:resource="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2004-04-07#504" />
      <rdf:li rdf:resource="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2004-03-23#482" />
      <rdf:li rdf:resource="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2004-01-06#442" />
      <rdf:li rdf:resource="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2003-12-02#433" />
      <rdf:li rdf:resource="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2003-10-23#395" />
      <rdf:li rdf:resource="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2003-08-05#232" />
      <rdf:li rdf:resource="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2003-07-07#202" />
      <rdf:li rdf:resource="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2003-06-25#187" />
      <rdf:li rdf:resource="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2003-06-25#183" />
      <rdf:li rdf:resource="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2003-06-18#138" />
      <rdf:li rdf:resource="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2003-06-10#274" />
      <rdf:li rdf:resource="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2003-06-08#108" />
      <rdf:li rdf:resource="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2003-06-08#261" />
      <rdf:li rdf:resource="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2003-06-08#258" />
      <rdf:li rdf:resource="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2003-06-06#257" />
      <rdf:li rdf:resource="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2003-06-06#103" />
      <rdf:li rdf:resource="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2003-06-06#256" />
      <rdf:li rdf:resource="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2003-06-06#255" />
      <rdf:li rdf:resource="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2003-06-05#100" />
      <rdf:li rdf:resource="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2003-06-05#253" />
      <rdf:li rdf:resource="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2003-06-04#363" />
      <rdf:li rdf:resource="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2003-05-30#346" />
      <rdf:li rdf:resource="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2003-05-22#52" />
      <rdf:li rdf:resource="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2003-05-22#322" />
      <rdf:li rdf:resource="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2003-05-22#50" />
      <rdf:li rdf:resource="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2003-05-20#308" />
      <rdf:li rdf:resource="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2003-05-18#305" />
   </rdf:Seq>
  </rss:items>
 </rss:channel>
 <rss:item xmlns:rss="http://purl.org/rss/1.0/" rdf:about="http://www.openlinksw.com/blog/vdb/blog/?date=2009-05-28#1558">
  <rss:title>Comparing Virtuoso Performance on Different Processors</rss:title>
  <dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2009-05-28T14:54:59Z</dc:date>
  <dc:description xmlns:dc="http://purl.org/dc/elements/1.1/">Over the years we have run Virtuoso on different hardware. We will here give a few figures that help identify the best price point for machines running Virtuoso. Our test is very simple: Load 20 warehouses of TPC-C data, and then run one client per warehouse for 10,000 new orders. The way this is set up, disk I/O does not play a role and lock contention between the clients is minimal. The test essentially has 20 server and 20 client threads running the same workload in parallel. The load time gives the single thread number; the 20 clients run gives the multi-threaded number. The test uses about 2-3 GB of data, so all is in RAM but is large enough not to be all in processor cache. All times reported are real times, starting from the start of the first client and ending with the completion of the last client. Do not confuse these results with official TPC-C. The measurement protocols are entirely incomparable. TABLE { background: none; border: none } TH { text-align: center; font-weight: bold } TR.top { background: } TD { text-align: center; border: none } Test Platform Load(seconds) Run(seconds) GHz / cores / threads 1 Amazon EC2 Extra Large(4 virtual cores) 340 42 1.2 GHz? / 4 / 1 1 Amazon EC2 Extra Large(4 virtual cores) 305 43.3 1.2 GHz? / 4 / 1 2 1 x dual-core AMD 5900 263 58.2 2.9 GHz / 2 / 1 3 2 x dual-core Xeon 5130 (&quot;Woodcrest&quot;) 245 35.7 2.0 GHz / 4 / 1 4 2 x quad-core Xeon 5410 (&quot;Harpertown&quot;) 237 18.0 2.33 GHz / 8 / 1 5 2 x quad-core Xeon 5520 (&quot;Nehalem&quot;) 162 18.3 2.26 GHz / 8 / 2 We tried two different EC2 instances to see if there would be variation. The variation was quite small. The tested EC2 instances costs 20 US cents per hour. The AMD dual-core costs 550 US dollars with 8G. The 3 Xeon configurations are Supermicro boards with 667MHz memory for the Xeon 5130 (&quot;Woodcrest&quot;) and Xeon 5410 (&quot;Harpertown&quot;), and 800MHz memory for the Nehalem. The Xeon systems cost between 4000 and 7000 US dollars, with 5000 for a configuration with 2 x Xeon 5520 (&quot;Nehalem&quot;), 72 GB RAM, and 8 x 500 GB SATA disks. Caveat: Due to slow memory (we could not get faster within available time), the results for the Nehalem do not take full advantage of its principal edge over the previous generation, i.e., memory subsystem. We&#39;ll see another time with faster memories. The operating systems were various 64 bit Linux distributions. We did some further measurements comparing Harpertown and Nehalem processors. The Nehalem chip was a bit faster for a slightly lower clock but we did not see any of the twofold and greater differences advertised by Intel. We tried some RDF operations on the two last systems: operation Harpertown Nehalem Build text index for DBpedia 1080s 770s Entity Rank iteration 263s 251s Then we tried to see if the core multithreading of Nehalem could be seen anywhere. To this effect, we ran the Fibonacci function in SQL to serve as an example of an all in-cache integer operation. 16 concurrent operations took exactly twice as long as 8 concurrent ones, as expected. For something that used memory, we took a count of RDF quads on two different indices, getting the same count. The database was a cluster setup with one process per core, so a count involved one thread per core. The counts in series took 5.02s and in parallel they took 4.27s. Then we took a more memory intensive piece that read the RDF quads table in the order of one index and for each row checked that there is the equal row on another, differently-partitioned index. This is a cross-partition join. One of the indices is read sequentially and the other at random. The throughput can be reported as random-lookups-per-second. The data was English DBpedia, about 140M triples. One such query takes a couple of minutes with a 650% CPU utilization. Running multiple such queries should show effects of core multithreading since we expect frequent cache misses. On the host OS of the Nehalem system â n cpu% rows per second 1 query 503 906,413 2 queries 1263 1,578,585 3 queries 1204 1,566,849 In a VM under Xen, on the Nehalem system â n cpu% rows per second 1 query 652 799,293 2 queries 1266 1,486,710 3 queries 1222 1,484,093 On the host OS of the Harpertown system â n cpu% rows per second 1 query 648 1,041,448 2 queries 708 1,124,866 The CPU percentages are as reported by the OS: user + system CPU divided by real time. So, Nehalem is in general somewhat faster, around 20-30%, than Harpertown. The effect of core multithreading can be noticed but is not huge, another 20% or so for situations with more threads than cores. The join where Harpertown did better could be attributed to its larger cache â 12 MB vs 8 MB. We see that Xen has a measurable but not prohibitive overhead; count a little under 10% for everything, also tasks with no I/O. The VM was set up to have all CPU for the test and the queries did not do disk I/O. The executables were compiled with gcc with default settings. Specifying -march=nocona (Core 2 target) dropped the cross-partition join time mentioned above from 128s to 122s on Harpertown. We did not try this on Nehalem but presume the effect would be the same, since the out-of-order unit is not much different. We did not do anything about process-to-memory affinity on Nehalem, which is a non-uniform architecture. We would expect this to increase performance since we have many equal size processes with even load. The mainstay of the Nehalem value proposition is a better memory subsystem. Since the unit we got was at 800 MHz memory, we did not see any great improvement. So if you buy Nehalem, you should make sure it is with 1333 MHz memory, else the best case will not be over 50% over a 667 MHz Core 2-based Xeon. Nehalem remains a better deal for us because of more memory per board. One Nehalem box with 72 GB costs less than two Harpertown boxes with 32 GB and offers almost the same performance. Having a lot of memory in a small space is key. With faster memory, it might even outperform two Harpertown boxes, but this remains to be seen. If space were not a constraint, we could make a cluster of 12 small workstations for the price of our largest system and get still more memory and more processor power per unit of memory. The Nehalem box was almost 4x faster than the AMD box but then it has 9x the memory, so the CPU to memory ratio might be better with the smaller boxes.</dc:description>
  <content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<p>Over the years we have run <a href="http://virtuoso.openlinksw.com" id="link-id0x16735e20">Virtuoso</a> on different hardware. We will here give a few figures that help identify the best price point for machines running Virtuoso.</p>

<p>Our test is very simple: <i>Load 20 warehouses of <a href="http://dbpedia.org/resource/TPC-C" id="link-id0x16e0dba8">TPC-C</a> <a href="http://dbpedia.org/resource/Data" id="link-id0x14ff4f80">data</a>, and then run one client per warehouse for 10,000 new orders</i>. The way this is set up, disk I/O does not play a role and lock contention between the clients is minimal.</p>

<p>The test essentially has 20 server and 20 client threads running the same workload in parallel. The load time gives the single thread number; the 20 clients run gives the multi-threaded number. The test uses about 2-3 GB of data, so all is in RAM but is large enough not to be all in processor cache.</p>

<p>All times reported are real times, starting from the start of the first client and ending with the completion of the last client.</p>

<p>Do not confuse these results with official TPC-C. The measurement protocols are entirely incomparable.</p>

    <style type="text/css">
      TABLE  { background: none; border: none }
      TH     { text-align: center; font-weight: bold }
      TR.top { background:  }
      TD     { text-align: center; border: none }
    </style>

<table align="center" cellspacing="10">
<tr>
  <th>Test</th>
  <th>Platform</th>
  <th>Load<br />(seconds)</th>
  <th>Run<br />(seconds)</th>
  <th>GHz / cores / threads</th>
</tr>
<tr>
  <td>1</td>
  <td>Amazon <a href="http://aws.amazon.com/ec2/" id="link-id0x15d68e20">EC2</a> Extra Large<br />(4 virtual cores)</td>
  <td>340</td>
  <td>42</td>
  <td>1.2 GHz? / 4 / 1</td>
</tr>
<tr>
  <td>1</td>
  <td>Amazon EC2 Extra Large<br />(4 virtual cores)</td>
  <td>305</td>
  <td>43.3</td>
  <td>1.2 GHz? / 4 / 1</td>
</tr>
<tr>
  <td>2</td>
  <td>1 x dual-core AMD 5900</td>
  <td>263</td>
  <td>58.2</td>
  <td>2.9 GHz / 2 / 1</td>
</tr>
<tr>
  <td>3</td>
  <td>2 x dual-core Xeon 5130 (&quot;Woodcrest&quot;)</td>
  <td>245</td>
  <td>35.7</td>
  <td>2.0 GHz / 4 / 1</td>
</tr>
<tr>
  <td>4</td>
  <td>2 x quad-core Xeon 5410 (&quot;Harpertown&quot;)</td>
  <td>237</td>
  <td>18.0</td>
  <td>2.33 GHz / 8 / 1</td>
</tr>
<tr>
  <td>5</td>
  <td>2 x quad-core Xeon 5520 (&quot;Nehalem&quot;)</td>
  <td>162</td>
  <td>18.3</td>
  <td>2.26 GHz / 8 / 2</td>
</tr>
</table>

<p>We tried two different EC2 instances to see if there would be variation. The variation was quite small. The tested EC2 instances costs 20 US cents per hour. The AMD dual-core costs 550 US dollars with 8G. The 3 Xeon configurations are Supermicro boards with 667MHz memory for the Xeon 5130 (&quot;Woodcrest&quot;) and Xeon 5410 (&quot;Harpertown&quot;), and 800MHz memory for the Nehalem. The Xeon systems cost between 4000 and 7000 US dollars, with 5000 for a configuration with 2 x Xeon 5520 (&quot;Nehalem&quot;), 72 GB RAM, and 8 x 500 GB SATA disks.</p>

<p>
<i>Caveat: Due to slow memory (we could not get faster within available time), the results for the Nehalem do not take full advantage of its principal edge over the previous generation, i.e., memory subsystem. We&#39;ll see another time with faster memories.</i>
</p>

<p>The operating systems were various 64 bit Linux distributions.</p>

<p>We did some further measurements comparing Harpertown and Nehalem processors. The Nehalem chip was a bit faster for a slightly lower clock but we did not see any of the twofold and greater differences advertised by Intel.</p>

<p>We tried some <a href="http://dbpedia.org/resource/Resource_Description_Framework" id="link-id0x1460b688">RDF</a> operations on the two last systems:</p>

<table align="center" cellspacing="10">
<tr>
  <th>operation</th>
  <th> Harpertown</th>
  <th>Nehalem</th>
</tr>

<tr>
  <th>Build text index for <a href="http://dbpedia.org/resource/DBpedia" id="link-id0x16a94590">DBpedia</a></th>
  <td>1080s</td>
  <td>770s</td>
</tr>
<tr>
  <th><a href="http://dbpedia.org/resource/Entity" id="link-id0xc37f380">Entity</a> Rank iteration</th>
  <td>263s</td>
  <td>251s</td>
</tr>
</table>

<p>Then we tried to see if the core multithreading of Nehalem could be seen anywhere. To this effect, we ran the Fibonacci function in <a href="http://dbpedia.org/resource/SQL" id="link-id0x15842a20">SQL</a> to serve as an example of an all in-cache integer operation. 16 concurrent operations took exactly twice as long as 8 concurrent ones, as expected.</p>

<p>For something that used memory, we took a count of RDF quads on two different indices, getting the same count. The database was a cluster setup with one process per core, so a count involved one thread per core. The counts in series took 5.02s and in parallel they took 4.27s.</p>

<p>Then we took a more memory intensive piece that read the RDF quads table in the order of one index and for each row checked that there is the equal row on another, differently-partitioned index. This is a cross-partition join. One of the indices is read sequentially and the other at random. The throughput can be reported as random-lookups-per-second. The data was English DBpedia, about 140M triples. One such query takes a couple of minutes with a 650% CPU utilization. Running multiple such queries should show effects of core multithreading since we expect frequent cache misses.</p>

<ol>
<li>On the host OS of the Nehalem system â
<table align="center" cellspacing="10">
<tr>
      <th>n</th>
      <th>cpu%</th>
      <th>rows per second</th>
    </tr>
<tr>
      <th>1 query</th>
      <td>503</td>
      <td>906,413</td>
    </tr>
<tr>
      <th>2 queries</th>
      <td>1263</td>
      <td>1,578,585</td>
    </tr>
<tr>
      <th>3 queries</th>
      <td>1204</td>
      <td>1,566,849</td>
    </tr>
</table>
</li>
<li>In a VM under Xen, on the Nehalem system â
<table align="center" cellspacing="10">
<tr>
      <th>n</th>
      <th>cpu%</th>
      <th>rows per second</th>
    </tr>
<tr>
      <th>1 query</th>
      <td>652</td>
      <td>799,293</td>
    </tr>
<tr>
      <th>2 queries</th>
      <td>1266</td>
      <td>1,486,710</td>
    </tr>
<tr>
      <th>3 queries</th>
      <td>1222</td>
      <td>1,484,093</td>
    </tr>
</table>
</li>
<li> On the host OS of the Harpertown system â
<table align="center" cellspacing="10">
<tr>
      <th>n</th>
      <th>cpu%</th>
      <th>rows per second</th>
    </tr>
<tr>
      <th>1 query</th>
      <td> 648 </td>
      <td> 1,041,448 </td>
    </tr>
<tr>
      <th>2 queries</th>
      <td> 708 </td>
      <td> 1,124,866 </td>
    </tr>
</table>
</li>
</ol>

<p>The CPU percentages are as reported by the OS: user + system CPU divided by real time.</p>

<p>So, Nehalem is in general somewhat faster, around 20-30%, than Harpertown. The effect of core multithreading can be noticed but is not huge, another 20% or so for situations with more threads than cores. The join where Harpertown did better could be attributed to its larger cache â 12 MB vs 8 MB.</p>

<p>We see that Xen has a measurable but not prohibitive overhead; count a little under 10% for everything, also tasks with no I/O. The VM was set up to have all CPU for the test and the queries did not do disk I/O.</p>

<p>The executables were compiled with <code>gcc</code> with default settings. Specifying <code>-march=nocona</code> (Core 2 target) dropped the cross-partition join time mentioned above from 128s to 122s on Harpertown. We did not try this on Nehalem but presume the effect would be the same, since the out-of-order unit is not much different. We did not do anything about process-to-memory affinity on Nehalem, which is a non-uniform architecture. We would expect this to increase performance since we have many equal size processes with even load.</p>

<p>The mainstay of the Nehalem value proposition is a better memory subsystem. Since the unit we got was at 800 MHz memory, we did not see any great improvement. So if you buy Nehalem, you should make sure it is with 1333 MHz memory, else the best case will not be over 50% over a 667 MHz Core 2-based Xeon.</p>

<p>Nehalem remains a better deal for us because of more memory per board. One Nehalem box with 72 GB costs less than two Harpertown boxes with 32 GB and offers almost the same performance. Having a lot of memory in a small space is key. With faster memory, it might even outperform two Harpertown boxes, but this remains to be seen.</p>

<p>If space were not a constraint, we could make a cluster of 12 small workstations for the price of our largest system and get still more memory and more processor power per unit of memory. The Nehalem box was almost 4x faster than the AMD box but then it has 9x the memory, so the CPU to memory ratio might be better with the smaller boxes.</p>]]></content:encoded>
 </rss:item>
 <rss:item xmlns:rss="http://purl.org/rss/1.0/" rdf:about="http://www.openlinksw.com/weblog/oerling/?date=2009-05-28#1557">
  <rss:title>Comparing Virtuoso Performance on Different Processors</rss:title>
  <dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2009-05-28T14:54:59Z</dc:date>
  <dc:description xmlns:dc="http://purl.org/dc/elements/1.1/">Over the years we have run Virtuoso on different hardware. We will here give a few figures that help identify the best price point for machines running Virtuoso. Our test is very simple: Load 20 warehouses of TPC-C data, and then run one client per warehouse for 10,000 new orders. The way this is set up, disk I/O does not play a role and lock contention between the clients is minimal. The test essentially has 20 server and 20 client threads running the same workload in parallel. The load time gives the single thread number; the 20 clients run gives the multi-threaded number. The test uses about 2-3 GB of data, so all is in RAM but is large enough not to be all in processor cache. All times reported are real times, starting from the start of the first client and ending with the completion of the last client. Do not confuse these results with official TPC-C. The measurement protocols are entirely incomparable. TABLE { background: none; border: none } TH { text-align: center; font-weight: bold } TR.top { background: } TD { text-align: center; border: none } Test Platform Load(seconds) Run(seconds) GHz / cores / threads 1 Amazon EC2 Extra Large(4 virtual cores) 340 42 1.2 GHz? / 4 / 1 1 Amazon EC2 Extra Large(4 virtual cores) 305 43.3 1.2 GHz? / 4 / 1 2 1 x dual-core AMD 5900 263 58.2 2.9 GHz / 2 / 1 3 2 x dual-core Xeon 5130 (&quot;Woodcrest&quot;) 245 35.7 2.0 GHz / 4 / 1 4 2 x quad-core Xeon 5410 (&quot;Harpertown&quot;) 237 18.0 2.33 GHz / 8 / 1 5 2 x quad-core Xeon 5520 (&quot;Nehalem&quot;) 162 18.3 2.26 GHz / 8 / 2 We tried two different EC2 instances to see if there would be variation. The variation was quite small. The tested EC2 instances costs 20 US cents per hour. The AMD dual-core costs 550 US dollars with 8G. The 3 Xeon configurations are Supermicro boards with 667MHz memory for the Xeon 5130 (&quot;Woodcrest&quot;) and Xeon 5410 (&quot;Harpertown&quot;), and 800MHz memory for the Nehalem. The Xeon systems cost between 4000 and 7000 US dollars, with 5000 for a configuration with 2 x Xeon 5520 (&quot;Nehalem&quot;), 72 GB RAM, and 8 x 500 GB SATA disks. Caveat: Due to slow memory (we could not get faster within available time), the results for the Nehalem do not take full advantage of its principal edge over the previous generation, i.e., memory subsystem. We&#39;ll see another time with faster memories. The operating systems were various 64 bit Linux distributions. We did some further measurements comparing Harpertown and Nehalem processors. The Nehalem chip was a bit faster for a slightly lower clock but we did not see any of the twofold and greater differences advertised by Intel. We tried some RDF operations on the two last systems: operation Harpertown Nehalem Build text index for DBpedia 1080s 770s Entity Rank iteration 263s 251s Then we tried to see if the core multithreading of Nehalem could be seen anywhere. To this effect, we ran the Fibonacci function in SQL to serve as an example of an all in-cache integer operation. 16 concurrent operations took exactly twice as long as 8 concurrent ones, as expected. For something that used memory, we took a count of RDF quads on two different indices, getting the same count. The database was a cluster setup with one process per core, so a count involved one thread per core. The counts in series took 5.02s and in parallel they took 4.27s. Then we took a more memory intensive piece that read the RDF quads table in the order of one index and for each row checked that there is the equal row on another, differently-partitioned index. This is a cross-partition join. One of the indices is read sequentially and the other at random. The throughput can be reported as random-lookups-per-second. The data was English DBpedia, about 140M triples. One such query takes a couple of minutes with a 650% CPU utilization. Running multiple such queries should show effects of core multithreading since we expect frequent cache misses. On the host OS of the Nehalem system â n cpu% rows per second 1 query 503 906,413 2 queries 1263 1,578,585 3 queries 1204 1,566,849 In a VM under Xen, on the Nehalem system â n cpu% rows per second 1 query 652 799,293 2 queries 1266 1,486,710 3 queries 1222 1,484,093 On the host OS of the Harpertown system â n cpu% rows per second 1 query 648 1,041,448 2 queries 708 1,124,866 The CPU percentages are as reported by the OS: user + system CPU divided by real time. So, Nehalem is in general somewhat faster, around 20-30%, than Harpertown. The effect of core multithreading can be noticed but is not huge, another 20% or so for situations with more threads than cores. The join where Harpertown did better could be attributed to its larger cache â 12 MB vs 8 MB. We see that Xen has a measurable but not prohibitive overhead; count a little under 10% for everything, also tasks with no I/O. The VM was set up to have all CPU for the test and the queries did not do disk I/O. The executables were compiled with gcc with default settings. Specifying -march=nocona (Core 2 target) dropped the cross-partition join time mentioned above from 128s to 122s on Harpertown. We did not try this on Nehalem but presume the effect would be the same, since the out-of-order unit is not much different. We did not do anything about process-to-memory affinity on Nehalem, which is a non-uniform architecture. We would expect this to increase performance since we have many equal size processes with even load. The mainstay of the Nehalem value proposition is a better memory subsystem. Since the unit we got was at 800 MHz memory, we did not see any great improvement. So if you buy Nehalem, you should make sure it is with 1333 MHz memory, else the best case will not be over 50% over a 667 MHz Core 2-based Xeon. Nehalem remains a better deal for us because of more memory per board. One Nehalem box with 72 GB costs less than two Harpertown boxes with 32 GB and offers almost the same performance. Having a lot of memory in a small space is key. With faster memory, it might even outperform two Harpertown boxes, but this remains to be seen. If space were not a constraint, we could make a cluster of 12 small workstations for the price of our largest system and get still more memory and more processor power per unit of memory. The Nehalem box was almost 4x faster than the AMD box but then it has 9x the memory, so the CPU to memory ratio might be better with the smaller boxes.</dc:description>
  <content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<p>Over the years we have run <a href="http://virtuoso.openlinksw.com" id="link-id0xd420b90">Virtuoso</a> on different hardware. We will here give a few figures that help identify the best price point for machines running Virtuoso.</p>

<p>Our test is very simple: <i>Load 20 warehouses of <a href="http://dbpedia.org/resource/TPC-C" id="link-id0xdaaec90">TPC-C</a> <a href="http://dbpedia.org/resource/Data" id="link-id0xca1b7e0">data</a>, and then run one client per warehouse for 10,000 new orders</i>. The way this is set up, disk I/O does not play a role and lock contention between the clients is minimal.</p>

<p>The test essentially has 20 server and 20 client threads running the same workload in parallel. The load time gives the single thread number; the 20 clients run gives the multi-threaded number. The test uses about 2-3 GB of data, so all is in RAM but is large enough not to be all in processor cache.</p>

<p>All times reported are real times, starting from the start of the first client and ending with the completion of the last client.</p>

<p>Do not confuse these results with official TPC-C. The measurement protocols are entirely incomparable.</p>

    <style type="text/css">
      TABLE  { background: none; border: none }
      TH     { text-align: center; font-weight: bold }
      TR.top { background:  }
      TD     { text-align: center; border: none }
    </style>

<table align="center" cellspacing="10">
<tr>
  <th>Test</th>
  <th>Platform</th>
  <th>Load<br />(seconds)</th>
  <th>Run<br />(seconds)</th>
  <th>GHz / cores / threads</th>
</tr>
<tr>
  <td>1</td>
  <td>Amazon <a href="http://aws.amazon.com/ec2/" id="link-id0xdaab030">EC2</a> Extra Large<br />(4 virtual cores)</td>
  <td>340</td>
  <td>42</td>
  <td>1.2 GHz? / 4 / 1</td>
</tr>
<tr>
  <td>1</td>
  <td>Amazon EC2 Extra Large<br />(4 virtual cores)</td>
  <td>305</td>
  <td>43.3</td>
  <td>1.2 GHz? / 4 / 1</td>
</tr>
<tr>
  <td>2</td>
  <td>1 x dual-core AMD 5900</td>
  <td>263</td>
  <td>58.2</td>
  <td>2.9 GHz / 2 / 1</td>
</tr>
<tr>
  <td>3</td>
  <td>2 x dual-core Xeon 5130 (&quot;Woodcrest&quot;)</td>
  <td>245</td>
  <td>35.7</td>
  <td>2.0 GHz / 4 / 1</td>
</tr>
<tr>
  <td>4</td>
  <td>2 x quad-core Xeon 5410 (&quot;Harpertown&quot;)</td>
  <td>237</td>
  <td>18.0</td>
  <td>2.33 GHz / 8 / 1</td>
</tr>
<tr>
  <td>5</td>
  <td>2 x quad-core Xeon 5520 (&quot;Nehalem&quot;)</td>
  <td>162</td>
  <td>18.3</td>
  <td>2.26 GHz / 8 / 2</td>
</tr>
</table>

<p>We tried two different EC2 instances to see if there would be variation. The variation was quite small. The tested EC2 instances costs 20 US cents per hour. The AMD dual-core costs 550 US dollars with 8G. The 3 Xeon configurations are Supermicro boards with 667MHz memory for the Xeon 5130 (&quot;Woodcrest&quot;) and Xeon 5410 (&quot;Harpertown&quot;), and 800MHz memory for the Nehalem. The Xeon systems cost between 4000 and 7000 US dollars, with 5000 for a configuration with 2 x Xeon 5520 (&quot;Nehalem&quot;), 72 GB RAM, and 8 x 500 GB SATA disks.</p>

<p>
<i>Caveat: Due to slow memory (we could not get faster within available time), the results for the Nehalem do not take full advantage of its principal edge over the previous generation, i.e., memory subsystem. We&#39;ll see another time with faster memories.</i>
</p>

<p>The operating systems were various 64 bit Linux distributions.</p>

<p>We did some further measurements comparing Harpertown and Nehalem processors. The Nehalem chip was a bit faster for a slightly lower clock but we did not see any of the twofold and greater differences advertised by Intel.</p>

<p>We tried some <a href="http://dbpedia.org/resource/Resource_Description_Framework" id="link-id0xce85438">RDF</a> operations on the two last systems:</p>

<table align="center" cellspacing="10">
<tr>
  <th>operation</th>
  <th> Harpertown</th>
  <th>Nehalem</th>
</tr>

<tr>
  <th>Build text index for <a href="http://dbpedia.org/resource/DBpedia" id="link-id0xab826a8">DBpedia</a></th>
  <td>1080s</td>
  <td>770s</td>
</tr>
<tr>
  <th><a href="http://dbpedia.org/resource/Entity" id="link-id0xcbb9938">Entity</a> Rank iteration</th>
  <td>263s</td>
  <td>251s</td>
</tr>
</table>

<p>Then we tried to see if the core multithreading of Nehalem could be seen anywhere. To this effect, we ran the Fibonacci function in <a href="http://dbpedia.org/resource/SQL" id="link-id0xcd62218">SQL</a> to serve as an example of an all in-cache integer operation. 16 concurrent operations took exactly twice as long as 8 concurrent ones, as expected.</p>

<p>For something that used memory, we took a count of RDF quads on two different indices, getting the same count. The database was a cluster setup with one process per core, so a count involved one thread per core. The counts in series took 5.02s and in parallel they took 4.27s.</p>

<p>Then we took a more memory intensive piece that read the RDF quads table in the order of one index and for each row checked that there is the equal row on another, differently-partitioned index. This is a cross-partition join. One of the indices is read sequentially and the other at random. The throughput can be reported as random-lookups-per-second. The data was English DBpedia, about 140M triples. One such query takes a couple of minutes with a 650% CPU utilization. Running multiple such queries should show effects of core multithreading since we expect frequent cache misses.</p>

<ol>
<li>On the host OS of the Nehalem system â
<table align="center" cellspacing="10">
<tr>
      <th>n</th>
      <th>cpu%</th>
      <th>rows per second</th>
    </tr>
<tr>
      <th>1 query</th>
      <td>503</td>
      <td>906,413</td>
    </tr>
<tr>
      <th>2 queries</th>
      <td>1263</td>
      <td>1,578,585</td>
    </tr>
<tr>
      <th>3 queries</th>
      <td>1204</td>
      <td>1,566,849</td>
    </tr>
</table>
</li>
<li>In a VM under Xen, on the Nehalem system â
<table align="center" cellspacing="10">
<tr>
      <th>n</th>
      <th>cpu%</th>
      <th>rows per second</th>
    </tr>
<tr>
      <th>1 query</th>
      <td>652</td>
      <td>799,293</td>
    </tr>
<tr>
      <th>2 queries</th>
      <td>1266</td>
      <td>1,486,710</td>
    </tr>
<tr>
      <th>3 queries</th>
      <td>1222</td>
      <td>1,484,093</td>
    </tr>
</table>
</li>
<li> On the host OS of the Harpertown system â
<table align="center" cellspacing="10">
<tr>
      <th>n</th>
      <th>cpu%</th>
      <th>rows per second</th>
    </tr>
<tr>
      <th>1 query</th>
      <td> 648 </td>
      <td> 1,041,448 </td>
    </tr>
<tr>
      <th>2 queries</th>
      <td> 708 </td>
      <td> 1,124,866 </td>
    </tr>
</table>
</li>
</ol>

<p>The CPU percentages are as reported by the OS: user + system CPU divided by real time.</p>

<p>So, Nehalem is in general somewhat faster, around 20-30%, than Harpertown. The effect of core multithreading can be noticed but is not huge, another 20% or so for situations with more threads than cores. The join where Harpertown did better could be attributed to its larger cache â 12 MB vs 8 MB.</p>

<p>We see that Xen has a measurable but not prohibitive overhead; count a little under 10% for everything, also tasks with no I/O. The VM was set up to have all CPU for the test and the queries did not do disk I/O.</p>

<p>The executables were compiled with <code>gcc</code> with default settings. Specifying <code>-march=nocona</code> (Core 2 target) dropped the cross-partition join time mentioned above from 128s to 122s on Harpertown. We did not try this on Nehalem but presume the effect would be the same, since the out-of-order unit is not much different. We did not do anything about process-to-memory affinity on Nehalem, which is a non-uniform architecture. We would expect this to increase performance since we have many equal size processes with even load.</p>

<p>The mainstay of the Nehalem value proposition is a better memory subsystem. Since the unit we got was at 800 MHz memory, we did not see any great improvement. So if you buy Nehalem, you should make sure it is with 1333 MHz memory, else the best case will not be over 50% over a 667 MHz Core 2-based Xeon.</p>

<p>Nehalem remains a better deal for us because of more memory per board. One Nehalem box with 72 GB costs less than two Harpertown boxes with 32 GB and offers almost the same performance. Having a lot of memory in a small space is key. With faster memory, it might even outperform two Harpertown boxes, but this remains to be seen.</p>

<p>If space were not a constraint, we could make a cluster of 12 small workstations for the price of our largest system and get still more memory and more processor power per unit of memory. The Nehalem box was almost 4x faster than the AMD box but then it has 9x the memory, so the CPU to memory ratio might be better with the smaller boxes.</p>]]></content:encoded>
 </rss:item>
 <rss:item xmlns:rss="http://purl.org/rss/1.0/" rdf:about="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2009-03-30#1539">
  <rss:title>Live Virtuoso instance hosting Linked Open Data (LOD) Cloud</rss:title>
  <dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2009-03-30T16:27:26Z</dc:date>
  <dc:description xmlns:dc="http://purl.org/dc/elements/1.1/">We have reached a beachead re. the Virtuoso instance hosting the Linked Open Data (LOD) Cloud; meaning, we are not going to be performing any major updates and deletions short-term, bar incorporation of fresh data sets from the Freebase and Bio2RDF projects (both communities a prepping new RDF data sets). At the current time we have loaded 100% of all the very large data sets from the LOD Cloud. As result, we can start the process of exposing Linked Data virtues in a manner that&#39;s palatable to users, developers, and database professionals across the Web 1.0, 2.0, and 3.0 spectrums. What does this mean? You can use the &quot;Search &amp; Find&quot; or&quot;URI Lookup&quot; or SPARQL endpoint associated with the LOD cloud hosting instance to perform the following tasks: Find entities associated with full text search patterns -- Google Style, but with Entity &amp; Text proximity Rank instead of Page Rank, since we are dealing with Entities rather than documents about entities Find and Lookup entities by Identifier (URI) -- which is helpful when locating URIs to use for identify entities in your own linked data spaces on the Web View entity descriptions via a variety of representation formats (HTML, RDFa, RDF/XML, N3, Turtle etc.) Determine uses of entity identifiers across the LOD cloud -- which helps you select preferred URIs based on usage statistics. What does it offer Web 1.0 and 2.0 developers? If you don&#39;t want to use the SPARQL based Web Service, or other Linked Data Web oriented APIs for interacting with the LOD cloud programmatically, you can simply use the powerful REST style Web Service that provides URL parameters for performing full text oriented &quot;Search&quot;, entity oriented &quot;Find&quot; queries, and faceted navigation over the huge data corpus with results data returned in JSON and XML formats. Next Steps: Amazon have agreed to add all the LOD Cloud data sets to their existing public data sets collective. Thus, the data sets we are loading will be available in &quot;raw data&quot; (RDF) format on the public data sets page via Named Elastic Block Storage (EBS) Snapshots); meaning, you can make an EC2 AMI (e.g. a Linux, Windows, Solaris) and install an RDF quad or triple store of choice into your AMI, then simply load data from the LOD cloud based on your needs. In addition to the above, we are also going to offer a Virtuoso 6.0 Cluster Edition based LOD Cloud AMI (as we&#39;ve already done with DBpedia, MusicBrainz, NeuroCommons, and Bio2Rdf) that will enable you to simply instantiate a personal and service specific edition of Virtuoso with all the LOD data in place and fully tuned for performance and scalability; basically, you will simply press &quot;Instantiate AMI&quot; and a LOD cloud data space, in true Linked Data from, will be at your disposal within minutes (i.e. the time it takes the DB to start). Work on the migration of the LOD data to EC2 starts this week. Thus, if you are interested in contributing an RDF based data set to the LOD cloud now is the time to get your archive links in place on the (see: ESW Wiki page for LOD Data Sets).</dc:description>
  <content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[
<p>We have reached a beachead re. the <a href="http://lod.openlinksw.com" id="link-id11a035e0">Virtuoso instance hosting the Linked Open Data (LOD) Cloud</a>; meaning, we are not going to be performing any major updates and deletions short-term, bar incorporation of fresh data sets from the Freebase and <a href="http://www.bio2rdf.org/" id="link-id121d7278">Bio2RDF</a> projects (both communities a prepping new RDF data sets).</p>  <p>At the current time we have loaded 100% of all the very large data sets from the <a href="http://www4.wiwiss.fu-berlin.de/bizer/pub/lod-datasets_2009-03-05.html" id="link-id1441f7e0">LOD Cloud</a>. As result, we can start the process of exposing <a href="http://dbpedia.org/resource/Linked_Data" id="link-id16c53de8">Linked Data</a> virtues in a manner that&#39;s palatable to users, developers, and database professionals across the <a href="http://dbpedia.org/resource/World_Wide_Web" id="link-id0x20165290">Web</a> 1.0, 2.0, and 3.0 spectrums.</p>  <h3>What does this mean?</h3> <p>You can use the &quot;Search &amp; Find&quot; or&quot;<a href="http://dbpedia.org/resource/Uniform_Resource_Identifier" id="link-id119c6878">URI</a> Lookup&quot; or <a href="http://dbpedia.org/resource/SPARQL" id="link-id157acde8">SPARQL</a> endpoint associated with the LOD cloud hosting instance to perform the following tasks:</p> <p>  </p> <ol> <li>Find entities associated with <a href="http://dbpedia.org/resource/Full_text_search" id="link-id11a82f28">full text search</a> patterns -- Google Style, but with <a href="http://dbpedia.org/resource/Entity" id="link-id131b6380">Entity</a> &amp; Text proximity Rank instead of Page Rank, since we are dealing with Entities rather than documents about entities</li> <li>Find and Lookup entities by Identifier (URI) -- which is helpful when locating URIs to use for identify entities in your own linked data spaces on the Web</li> <li>View entity descriptions via a variety of representation formats (HTML, <a href="http://dbpedia.org/resource/RDFa" id="link-id11e323b0">RDFa</a>, RDF/XML, N3, Turtle etc.)</li> <li>Determine uses of entity identifiers across the LOD cloud -- which helps you select preferred URIs based on usage statistics.</li> </ol>  <h3>What does it offer Web 1.0 and 2.0 developers?</h3> <p> If you don&#39;t want to use the <a href="http://lod.openlinksw.com/sparql" id="link-id15c1ec30">SPARQL based Web Service</a>, or other Linked Data <a href="http://dbpedia.org/resource/Giant_Global_Graph" id="link-id15ebd3b0">Web</a> oriented APIs for interacting with the LOD cloud programmatically, you can simply use the powerful <a href="http://virtuoso.openlinksw.com/dataspace/dav/wiki/Main/VirtuosoFacetsWebService" id="link-id12e556a8">REST style Web Service</a> that provides <a href="http://dbpedia.org/resource/Uniform_Resource_Locator" id="link-id12138090">URL</a> parameters for performing full text oriented &quot;Search&quot;, entity oriented &quot;Find&quot; queries, and faceted navigation over the huge data corpus with results data returned in JSON and XML formats.</p>  <h3>Next Steps:</h3> <p> Amazon have agreed to add all the LOD Cloud data sets to their existing <a href="http://aws.amazon.com/publicdatasets" id="link-id11989aa8">public data sets collective</a>. Thus, the data sets we are loading will be available in &quot;raw data&quot; (RDF) format on the public data sets page via Named Elastic Block Storage (EBS) Snapshots); meaning, you can make an EC2 AMI (e.g. a Linux, Windows, Solaris) and install an RDF quad or triple store of choice into your AMI, then simply load data from the LOD cloud based on your needs.</p> <p> In addition to the above, we are also going to offer a <a href="http://virtuoso.openlinksw.com/dataspace/dav/wiki/Main/VirtInstallationEC2" id="link-id13982a88">Virtuoso 6.0 Cluster Edition based LOD Cloud AMI</a> (as we&#39;ve already done with <a href="http://virtuoso.openlinksw.com/dataspace/dav/wiki/Main/VirtEC2AMIDBpediaInstall" id="link-id12cba108">DBpedia</a>, <a href="http://virtuoso.openlinksw.com/dataspace/dav/wiki/Main/VirtEC2AMIMusicBrainzInstall" id="link-id1390d338">MusicBrainz</a>, <a href="http://virtuoso.openlinksw.com/dataspace/dav/wiki/Main/VirtEC2AMINeuroCommonsInstall" id="link-id15801668">NeuroCommons</a>, and <a href="http://virtuoso.openlinksw.com/dataspace/dav/wiki/Main/VirtEC2AMIBio2rdfInstall" id="link-id133e0840">Bio2Rdf</a>) that will enable you to simply instantiate a personal and service specific edition of Virtuoso with all the LOD data in place and fully tuned for performance and scalability; basically, you will simply press &quot;Instantiate AMI&quot; and a LOD cloud <a href="http://en.wikipedia.org/wiki/Data_Spaces" id="link-id15ccbf80">data space</a>, in true Linked Data from, will be at your disposal within minutes (i.e. the time it takes the DB to start).</p>  <p>Work on the migration of the LOD data to EC2 starts this week. Thus, if you are interested in contributing an RDF based data set to the LOD cloud now is the time to get your archive links in place on the (see: <a href="http://esw.w3.org/topic/DataSetRDFDumps" id="link-id154d6f88">ESW Wiki page for LOD Data Sets</a>).</p> 
]]></content:encoded>
 </rss:item>
 <rss:item xmlns:rss="http://purl.org/rss/1.0/" rdf:about="http://www.openlinksw.com/blog/vdb/blog/?date=2008-12-17#1503">
  <rss:title>See the Lite:  Embeddable/Background Virtuoso starts at 25MB</rss:title>
  <dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2008-12-17T09:34:12Z</dc:date>
  <dc:description xmlns:dc="http://purl.org/dc/elements/1.1/">We have received many requests for an embeddable-scale Virtuoso. In response to this, we have added a Lite mode, where the initial size of a server process is a tiny fraction of what the initial size would be with default settings. With 2MB of disk cache buffers (ini file setting, NumberOfBuffers = 256), the process size stays under 30MB on 32-bit Linux. The value of this is that one can now have RDF and full text indexing on the desktop without running a Java VM or any other memory-intensive software. And of course, all of SQL (transactions, stored procedures, etc.) is in the same embeddably-sized container. The Lite executable is a full Virtuoso executable; the Lite mode is controlled by a switch in the configuration file. The executable size is about 10MB for 32-bit Linux. A database created in the Lite mode will be converted into a fully-featured database (tables and indexes are added, among other things) if the server is started with the Lite setting &quot;off&quot;; functionality can be reverted to Lite mode, though it will now consume somewhat more memory, etc. Lite mode offers full SQL and SPARQL/SPARUL (via SPASQL), but disables all HTTP-based services (WebDAV, application hosting, etc.). Clients can still use all typical database access mechanisms (i.e., ODBC, JDBC, OLE-DB, ADO.NET, and XMLA) to connect, including the Jena and Sesame frameworks for RDF. ODBC now offers full support of RDF data types for C-based clients. A Redland-compatible API also exists, for use with Redland v1.0.8 and later. Especially for embedded use, we now allow restricting the listener to be a Unix socket, which allows client connections only from the localhost. Shipping an embedded Virtuoso is easy. It just takes one executable and one configuration file. Performance is generally comparable to &quot;normal&quot; mode, except that Lite will be somewhat less scalable on multicore systems. The Lite mode will be included in the next Virtuoso 5 Open Source release.</dc:description>
  <content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<p>We have received many requests for an embeddable-scale <a href="http://virtuoso.openlinksw.com" id="link-id0x1cd69650">Virtuoso</a>.  In response to this, we have added a Lite mode, where the initial size of a server process is a tiny fraction of what the initial size would be with default settings.  With 2MB of disk cache buffers (ini file setting, <code>NumberOfBuffers = 256</code>), the process size stays under 30MB on 32-bit Linux.</p>

<p>The value of this is that one can now have <a href="http://dbpedia.org/resource/Resource_Description_Framework" id="link-id0x1ce89340">RDF</a> and full text indexing on the desktop without running a Java VM or any other memory-intensive software.  And of course, all of <a href="http://dbpedia.org/resource/SQL" id="link-id0x1cfc9288">SQL</a> (transactions, stored procedures, etc.) is in the same embeddably-sized container.</p>

<p>The Lite executable is a full Virtuoso executable; the Lite mode is controlled by a switch in the configuration file.  The executable size is about 10MB for 32-bit Linux.  A database created in the Lite mode will be converted into a fully-featured database (tables and indexes are added, among other things) if the server is started with the Lite setting &quot;off&quot;; functionality can be reverted to Lite mode, though it will now consume somewhat more memory, etc.</p>

<p>Lite mode offers full SQL and <a href="http://dbpedia.org/resource/SPARQL" id="link-id0x1c511da8">SPARQL</a>/SPARUL (via SPASQL), but disables all <a href="http://dbpedia.org/resource/Hypertext_Transfer_Protocol" id="link-id0x1dac1950">HTTP</a>-based services (WebDAV, application hosting, etc.).  Clients can still use all typical database access mechanisms (i.e., <a href="http://dbpedia.org/resource/Open_Database_Connectivity" id="link-id0xb19a488">ODBC</a>, <a href="http://dbpedia.org/resource/Java_Database_Connectivity" id="link-id0x1d93ee40">JDBC</a>, OLE-DB, <a href="http://dbpedia.org/resource/ADO.NET" id="link-id0x1ce391c0">ADO</a>.<a href="http://dbpedia.org/resource/.NET_Framework" id="link-id0xacf1168">NET</a>, and XMLA) to connect, including the <a href="http://jena.sourceforge.net/" id="link-id0xaaf5b58">Jena</a> and <a href="http://sourceforge.net/projects/sesame/" id="link-id0x1b1e4328">Sesame</a> frameworks for RDF.  ODBC now offers full support of RDF <a href="http://dbpedia.org/resource/Data" id="link-id0x1cfc9f78">data</a> types for <a href="http://dbpedia.org/resource/C%2B%2B" id="link-id0xa6059d8">C</a>-based clients.  A Redland-compatible API also exists, for use with Redland v1.0.8 and later. </p>

<p>Especially for embedded use, we now allow restricting the listener to be a Unix socket, which allows client connections only from the localhost.</p>

<p>Shipping an embedded Virtuoso is easy.  It just takes one executable and one configuration file.  Performance is generally comparable to &quot;normal&quot; mode, except that Lite will be somewhat less scalable on multicore systems.</p>

<p>The Lite mode will be included in the next Virtuoso 5 Open Source release.</p>]]></content:encoded>
 </rss:item>
 <rss:item xmlns:rss="http://purl.org/rss/1.0/" rdf:about="http://www.openlinksw.com/weblog/oerling/?date=2008-12-17#1502">
  <rss:title>See the Lite:  Embeddable/Background Virtuoso starts at 25MB</rss:title>
  <dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2008-12-17T09:34:12Z</dc:date>
  <dc:description xmlns:dc="http://purl.org/dc/elements/1.1/">We have received many requests for an embeddable-scale Virtuoso. In response to this, we have added a Lite mode, where the initial size of a server process is a tiny fraction of what the initial size would be with default settings. With 2MB of disk cache buffers (ini file setting, NumberOfBuffers = 256), the process size stays under 30MB on 32-bit Linux. The value of this is that one can now have RDF and full text indexing on the desktop without running a Java VM or any other memory-intensive software. And of course, all of SQL (transactions, stored procedures, etc.) is in the same embeddably-sized container. The Lite executable is a full Virtuoso executable; the Lite mode is controlled by a switch in the configuration file. The executable size is about 10MB for 32-bit Linux. A database created in the Lite mode will be converted into a fully-featured database (tables and indexes are added, among other things) if the server is started with the Lite setting &quot;off&quot;; functionality can be reverted to Lite mode, though it will now consume somewhat more memory, etc. Lite mode offers full SQL and SPARQL/SPARUL (via SPASQL), but disables all HTTP-based services (WebDAV, application hosting, etc.). Clients can still use all typical database access mechanisms (i.e., ODBC, JDBC, OLE-DB, ADO.NET, and XMLA) to connect, including the Jena and Sesame frameworks for RDF. ODBC now offers full support of RDF data types for C-based clients. A Redland-compatible API also exists, for use with Redland v1.0.8 and later. Especially for embedded use, we now allow restricting the listener to be a Unix socket, which allows client connections only from the localhost. Shipping an embedded Virtuoso is easy. It just takes one executable and one configuration file. Performance is generally comparable to &quot;normal&quot; mode, except that Lite will be somewhat less scalable on multicore systems. The Lite mode will be included in the next Virtuoso 5 Open Source release.</dc:description>
  <content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<p>We have received many requests for an embeddable-scale <a href="http://virtuoso.openlinksw.com" id="link-id0xa5aa1b38">Virtuoso</a>.  In response to this, we have added a Lite mode, where the initial size of a server process is a tiny fraction of what the initial size would be with default settings.  With 2MB of disk cache buffers (ini file setting, <code>NumberOfBuffers = 256</code>), the process size stays under 30MB on 32-bit Linux.</p>

<p>The value of this is that one can now have <a href="http://dbpedia.org/resource/Resource_Description_Framework" id="link-id0x1db79ac8">RDF</a> and full text indexing on the desktop without running a Java VM or any other memory-intensive software.  And of course, all of <a href="http://dbpedia.org/resource/SQL" id="link-id0xa923298">SQL</a> (transactions, stored procedures, etc.) is in the same embeddably-sized container.</p>

<p>The Lite executable is a full Virtuoso executable; the Lite mode is controlled by a switch in the configuration file.  The executable size is about 10MB for 32-bit Linux.  A database created in the Lite mode will be converted into a fully-featured database (tables and indexes are added, among other things) if the server is started with the Lite setting &quot;off&quot;; functionality can be reverted to Lite mode, though it will now consume somewhat more memory, etc.</p>

<p>Lite mode offers full SQL and <a href="http://dbpedia.org/resource/SPARQL" id="link-id0x1b388830">SPARQL</a>/SPARUL (via SPASQL), but disables all <a href="http://dbpedia.org/resource/Hypertext_Transfer_Protocol" id="link-id0x1d56b618">HTTP</a>-based services (WebDAV, application hosting, etc.).  Clients can still use all typical database access mechanisms (i.e., <a href="http://dbpedia.org/resource/Open_Database_Connectivity" id="link-id0x1c5abc38">ODBC</a>, <a href="http://dbpedia.org/resource/Java_Database_Connectivity" id="link-id0x1dade1f8">JDBC</a>, OLE-DB, <a href="http://dbpedia.org/resource/ADO.NET" id="link-id0x25d8e0f0">ADO</a>.<a href="http://dbpedia.org/resource/.NET_Framework" id="link-id0x1d7a1a28">NET</a>, and XMLA) to connect, including the <a href="http://jena.sourceforge.net/" id="link-id0x1d929b98">Jena</a> and <a href="http://sourceforge.net/projects/sesame/" id="link-id0x1b7a9088">Sesame</a> frameworks for RDF.  ODBC now offers full support of RDF <a href="http://dbpedia.org/resource/Data" id="link-id0xaf62aa0">data</a> types for <a href="http://dbpedia.org/resource/C%2B%2B" id="link-id0xa8784b0">C</a>-based clients.  A Redland-compatible API also exists, for use with Redland v1.0.8 and later. </p>

<p>Especially for embedded use, we now allow restricting the listener to be a Unix socket, which allows client connections only from the localhost.</p>

<p>Shipping an embedded Virtuoso is easy.  It just takes one executable and one configuration file.  Performance is generally comparable to &quot;normal&quot; mode, except that Lite will be somewhat less scalable on multicore systems.</p>

<p>The Lite mode will be included in the next Virtuoso 5 Open Source release.</p>]]></content:encoded>
 </rss:item>
 <rss:item xmlns:rss="http://purl.org/rss/1.0/" rdf:about="http://www.openlinksw.com/blog/vdb/blog/?date=2008-11-20#1485">
  <rss:title>Virtuoso Vs. MySQL:  Setting the Berlin Record Straight (update 2)</rss:title>
  <dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2008-11-20T11:06:11Z</dc:date>
  <dc:description xmlns:dc="http://purl.org/dc/elements/1.1/">In the context of the Berlin SPARQL Benchmark, I have repeatedly written about measurement procedures and steady state. The point is that the numbers at larger scales are unreliable due to cache behavior if one is not careful about measurement and does not have adequate warmup. Thus it came to pass that one cut of the BSBM paper had 3 seconds for MySQL and 100 for Virtuoso, basically through ignoring cache effects. So we decided to do it ourselves. The score is (updated with revised innodb_buffer_pool_size setting, based on advice noted down below): n-clients Virtuoso MySQL (with increased buffer pool size) MySQL (with default buffer poll size) 1 41,161.33 27,023.11 12,171.41 4 127,918.30 (pending) 37,566.82 8 218,162.29 105,524.23 51,104.39 16 214,763.58 98,852.42 47,589.18 The metric is the query mixes per hour from the BSBM test driver output. For the interested, the complete output is here. The benchmark is pure SQL, nothing to do with SPARQL or RDF. The hardware is 2 x Xeon 5345 (2 x quad core, 2.33 GHz), 16 G RAM. The OS is 64-bit Debian Linux. The benchmark was run at a scale of 200,000. Each run had 2000 warm-up query mixes and 500 measured query mixes, which gives steady state, eliminating any effects of OS disk cache and the like. Both databases were configured to use 8G for disk cache. The test effectively runs from memory. We ran an analyze table on each MySQL table but noticed that this had no effect. Virtuoso does the stats sampling on the go; possibly MySQL also since the explicit stats did not make any difference. The MySQL tables were served by the InnoDB engine. MySQL appears to cache results of queries in some cases. This was not apparent in the tests. The versions are 5.09 for Virtuoso and 5.1.29 for MySQL. You can download and examine -- Virtuoso configuration file MySQL configuration file Table definitions &amp; RDF views Indexes on MySQL tables MySQL ought to do better. We suspect that here, just as in the TPC-D experiment we made way back, the query plans are not quite right. Also we rarely saw over 300% CPU utilization for MySQL. It is possible there is a config parameter that affects this. The public is invited to tell us about such. Update: Andreas Schultz of the BSBM team advised us to increase the innodb_buffer_pool_size setting in the MySQL config. We did and it produced some improvement. Indeed, this is more like it, as we now see CPU utilization around 700% instead of the 300% in the previously published run, which rendered it suspect. Also, our experiments with TPC-D led us to expect better. We ran these things a few times so as to have warm cache. On the first run, we noticed that the Innodb warm up time was somewhere well in excess of 2000 query mixes. Another time, we should make a graph of throughput as a function of time for both MySQL and Virtuoso. We recently made a greedy prefetch hack that should give us some mileage there. For the next BSBM, all we can advise is to run larger scale system for half an hour first and then measure and then measure again. If the second measurement is the same as the first then it is good. As always, since MySQL is not our specialty, we confidently invite the public to tell us how to make it run faster. So, unless something more turns up, our next trial is a revisit of TPC-H.</dc:description>
  <content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<p>In the context of the <a href="http://www4.wiwiss.fu-berlin.de/bizer/BerlinSPARQLBenchmark/spec/index.html" id="link-id0xa322b58">Berlin SPARQL Benchmark</a>, I have repeatedly written about measurement procedures and steady state.  The point is that the numbers at larger scales are unreliable due to cache behavior if one is not careful about measurement and does not have adequate warmup.  Thus it came to pass that one cut of the <a href="http://www4.wiwiss.fu-berlin.de/bizer/BerlinSPARQLBenchmark/spec/index.html" id="link-id0x9524730">BSBM</a> paper had 3 seconds for <a href="http://dbpedia.org/resource/MySQL" id="link-id0x2ba8db0">MySQL</a> and 100 for <a href="http://virtuoso.openlinksw.com" id="link-id0xa9137d0">Virtuoso</a>, basically through ignoring cache effects.</p>

<p>So we decided to do it ourselves.</p>

<p>The score is (updated with revised <code>innodb_buffer_pool_size</code> setting, based on advice noted down below):</p>

<table border="1" cellspacing="2" cellpadding="5">
<tr>
    <th>n-clients</th>
    <th>Virtuoso</th>
    <th>MySQL <br /> (with increased buffer pool size)</th>
    <th>MySQL <br /> (with default buffer poll size)</th>
  </tr>
<tr align="right">
    <td>1</td>
    <td> 41,161.33</td>
    <td> 27,023.11 </td>
    <td> 12,171.41</td>
  </tr>
<tr align="right">
    <td>4</td>
    <td> 127,918.30</td>
    <td> (pending) </td>
    <td>  37,566.82</td>
  </tr>
<tr align="right">
    <td>8</td>
    <td> 218,162.29 </td>
    <td> 105,524.23 </td>
    <td>  51,104.39 </td>
  </tr>
<tr align="right">
    <td>16</td>
    <td> 214,763.58 </td>
    <td>  98,852.42 </td>
    <td>  47,589.18 </td>
  </tr>
</table>


<p>The metric is the query mixes per hour from the BSBM test driver output.  For the interested, the complete output is <a href="http://www.openlinksw.com/weblog/oerling/texts/bsbmres.txt" id="link-id1119f770">here</a>.</p>

<p>The benchmark is pure <a href="http://dbpedia.org/resource/SQL" id="link-id0x2b61c88">SQL</a>, nothing to do with <a href="http://dbpedia.org/resource/SPARQL" id="link-id0x17a6d408">SPARQL</a> or <a href="http://dbpedia.org/resource/Resource_Description_Framework" id="link-id0x9a0a968">RDF</a>.</p>

<p>The hardware is 2 x Xeon 5345 (2 x quad core, 2.33 GHz), 16 G RAM.  The OS is 64-bit Debian Linux.</p>

<p>The benchmark was run at a scale of 200,000.  Each run had 2000 warm-up query mixes and 500 measured query mixes, which gives steady state, eliminating any effects of OS disk cache and the like.  Both databases were configured to use 8G for disk cache.  The test effectively runs from memory.  We ran an analyze table on each MySQL table but noticed that this had no effect.  Virtuoso does the stats sampling on the go; possibly MySQL also since the explicit stats did not make any difference.  The MySQL tables were served by the InnoDB engine.  MySQL appears to cache results of queries in some cases.  This was not apparent in the tests.</p>

<p>The versions are 5.09 for Virtuoso and 5.1.29 for MySQL.  You can download and examine --</p>
<ul> 
<li>
<a href="http://www.openlinksw.com/weblog/oerling/texts/virtuoso.ini" id="link-id14fe17f0">Virtuoso configuration file</a>
</li>
<li>
<a href="http://www.openlinksw.com/weblog/oerling/texts/my.cnf" id="link-id116fe490">MySQL configuration file</a>
</li>
<li>
    <a href="http://www.openlinksw.com/weblog/oerling/texts/create_tables_and_rdf_view.sql" id="link-id14ce9268">Table definitions &amp; RDF views</a> 
</li>
<li> <a href="http://www.openlinksw.com/weblog/oerling/texts/mysqlinx.sql" id="link-id1535e298">Indexes on MySQL tables</a>
</li>
</ul>

<p>
<strike>MySQL ought to do better.  We suspect that here, just as in the TPC-D experiment we made way back, the query plans are not quite right. Also we rarely saw over 300% CPU utilization for MySQL.  It is possible there is a config parameter that affects this.  The public is invited to tell us about such.</strike>
</p>

<p>
<b>Update:</b>
</p>

<p>Andreas Schultz of the BSBM team advised us to increase the <code>innodb_buffer_pool_size</code> setting in the MySQL config.  We did and it produced some improvement.  Indeed, this is more like it, as we now see CPU utilization around 700% instead of the 300% in the previously published run, which rendered it suspect. Also, our experiments with TPC-D led us to expect better.  We ran these things a few times so as to have warm cache.</p>

<p>On the first run, we noticed that the Innodb warm up time was somewhere well in excess of 2000 query mixes.  Another time, we should make a graph of throughput as a function of time for both MySQL and Virtuoso.  We recently made a greedy prefetch hack that should give us some mileage there.  For the next BSBM, all we can advise is to run larger scale system for half an hour first and then measure and then measure again.  If the second measurement is the same as the first then it is good.</p>

<p>As always, since MySQL is not our specialty, we confidently invite the public to tell us how to make it run faster. So, unless something more turns up, our next trial is a revisit of <a href="http://dbpedia.org/resource/TPC-H" id="link-id0x17a20498">TPC-H</a>.</p>]]></content:encoded>
 </rss:item>
 <rss:item xmlns:rss="http://purl.org/rss/1.0/" rdf:about="http://www.openlinksw.com/weblog/oerling/?date=2008-11-20#1484">
  <rss:title>Virtuoso Vs. MySQL:  Setting the Berlin Record Straight (update 2)</rss:title>
  <dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2008-11-20T11:06:11Z</dc:date>
  <dc:description xmlns:dc="http://purl.org/dc/elements/1.1/">In the context of the Berlin SPARQL Benchmark, I have repeatedly written about measurement procedures and steady state. The point is that the numbers at larger scales are unreliable due to cache behavior if one is not careful about measurement and does not have adequate warmup. Thus it came to pass that one cut of the BSBM paper had 3 seconds for MySQL and 100 for Virtuoso, basically through ignoring cache effects. So we decided to do it ourselves. The score is (updated with revised innodb_buffer_pool_size setting, based on advice noted down below): n-clients Virtuoso MySQL (with increased buffer pool size) MySQL (with default buffer poll size) 1 41,161.33 27,023.11 12,171.41 4 127,918.30 (pending) 37,566.82 8 218,162.29 105,524.23 51,104.39 16 214,763.58 98,852.42 47,589.18 The metric is the query mixes per hour from the BSBM test driver output. For the interested, the complete output is here. The benchmark is pure SQL, nothing to do with SPARQL or RDF. The hardware is 2 x Xeon 5345 (2 x quad core, 2.33 GHz), 16 G RAM. The OS is 64-bit Debian Linux. The benchmark was run at a scale of 200,000. Each run had 2000 warm-up query mixes and 500 measured query mixes, which gives steady state, eliminating any effects of OS disk cache and the like. Both databases were configured to use 8G for disk cache. The test effectively runs from memory. We ran an analyze table on each MySQL table but noticed that this had no effect. Virtuoso does the stats sampling on the go; possibly MySQL also since the explicit stats did not make any difference. The MySQL tables were served by the InnoDB engine. MySQL appears to cache results of queries in some cases. This was not apparent in the tests. The versions are 5.09 for Virtuoso and 5.1.29 for MySQL. You can download and examine -- Virtuoso configuration file MySQL configuration file Table definitions &amp; RDF views Indexes on MySQL tables MySQL ought to do better. We suspect that here, just as in the TPC-D experiment we made way back, the query plans are not quite right. Also we rarely saw over 300% CPU utilization for MySQL. It is possible there is a config parameter that affects this. The public is invited to tell us about such. Update: Andreas Schultz of the BSBM team advised us to increase the innodb_buffer_pool_size setting in the MySQL config. We did and it produced some improvement. Indeed, this is more like it, as we now see CPU utilization around 700% instead of the 300% in the previously published run, which rendered it suspect. Also, our experiments with TPC-D led us to expect better. We ran these things a few times so as to have warm cache. On the first run, we noticed that the Innodb warm up time was somewhere well in excess of 2000 query mixes. Another time, we should make a graph of throughput as a function of time for both MySQL and Virtuoso. We recently made a greedy prefetch hack that should give us some mileage there. For the next BSBM, all we can advise is to run larger scale system for half an hour first and then measure and then measure again. If the second measurement is the same as the first then it is good. As always, since MySQL is not our specialty, we confidently invite the public to tell us how to make it run faster. So, unless something more turns up, our next trial is a revisit of TPC-H.</dc:description>
  <content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<p>In the context of the <a href="http://www4.wiwiss.fu-berlin.de/bizer/BerlinSPARQLBenchmark/spec/index.html" id="link-id0xa5314d8">Berlin SPARQL Benchmark</a>, I have repeatedly written about measurement procedures and steady state.  The point is that the numbers at larger scales are unreliable due to cache behavior if one is not careful about measurement and does not have adequate warmup.  Thus it came to pass that one cut of the <a href="http://www4.wiwiss.fu-berlin.de/bizer/BerlinSPARQLBenchmark/spec/index.html" id="link-id0x18482c20">BSBM</a> paper had 3 seconds for <a href="http://dbpedia.org/resource/MySQL" id="link-id0xb8c54de8">MySQL</a> and 100 for <a href="http://virtuoso.openlinksw.com" id="link-id0x189b2210">Virtuoso</a>, basically through ignoring cache effects.</p>

<p>So we decided to do it ourselves.</p>

<p>The score is (updated with revised <code>innodb_buffer_pool_size</code> setting, based on advice noted down below):</p>

<table border="1" cellspacing="2" cellpadding="5">
<tr>
    <th>n-clients</th>
    <th>Virtuoso</th>
    <th>MySQL <br /> (with increased buffer pool size)</th>
    <th>MySQL <br /> (with default buffer poll size)</th>
  </tr>
<tr align="right">
    <td>1</td>
    <td> 41,161.33</td>
    <td> 27,023.11 </td>
    <td> 12,171.41</td>
  </tr>
<tr align="right">
    <td>4</td>
    <td> 127,918.30</td>
    <td> (pending) </td>
    <td>  37,566.82</td>
  </tr>
<tr align="right">
    <td>8</td>
    <td> 218,162.29 </td>
    <td> 105,524.23 </td>
    <td>  51,104.39 </td>
  </tr>
<tr align="right">
    <td>16</td>
    <td> 214,763.58 </td>
    <td>  98,852.42 </td>
    <td>  47,589.18 </td>
  </tr>
</table>


<p>The metric is the query mixes per hour from the BSBM test driver output.  For the interested, the complete output is <a href="http://www.openlinksw.com/weblog/oerling/texts/bsbmres.txt" id="link-id1119f770">here</a>.</p>

<p>The benchmark is pure <a href="http://dbpedia.org/resource/SQL" id="link-id0x5257718">SQL</a>, nothing to do with <a href="http://dbpedia.org/resource/SPARQL" id="link-id0xb8c463e0">SPARQL</a> or <a href="http://dbpedia.org/resource/Resource_Description_Framework" id="link-id0x16e68d50">RDF</a>.</p>

<p>The hardware is 2 x Xeon 5345 (2 x quad core, 2.33 GHz), 16 G RAM.  The OS is 64-bit Debian Linux.</p>

<p>The benchmark was run at a scale of 200,000.  Each run had 2000 warm-up query mixes and 500 measured query mixes, which gives steady state, eliminating any effects of OS disk cache and the like.  Both databases were configured to use 8G for disk cache.  The test effectively runs from memory.  We ran an analyze table on each MySQL table but noticed that this had no effect.  Virtuoso does the stats sampling on the go; possibly MySQL also since the explicit stats did not make any difference.  The MySQL tables were served by the InnoDB engine.  MySQL appears to cache results of queries in some cases.  This was not apparent in the tests.</p>

<p>The versions are 5.09 for Virtuoso and 5.1.29 for MySQL.  You can download and examine --</p>
<ul> 
<li>
<a href="http://www.openlinksw.com/weblog/oerling/texts/virtuoso.ini" id="link-id14fe17f0">Virtuoso configuration file</a>
</li>
<li>
<a href="http://www.openlinksw.com/weblog/oerling/texts/my.cnf" id="link-id116fe490">MySQL configuration file</a>
</li>
<li>
    <a href="http://www.openlinksw.com/weblog/oerling/texts/create_tables_and_rdf_view.sql" id="link-id14ce9268">Table definitions &amp; RDF views</a> 
</li>
<li> <a href="http://www.openlinksw.com/weblog/oerling/texts/mysqlinx.sql" id="link-id1535e298">Indexes on MySQL tables</a>
</li>
</ul>

<p>
<strike>MySQL ought to do better.  We suspect that here, just as in the TPC-D experiment we made way back, the query plans are not quite right. Also we rarely saw over 300% CPU utilization for MySQL.  It is possible there is a config parameter that affects this.  The public is invited to tell us about such.</strike>
</p>

<p>
<b>Update:</b>
</p>

<p>Andreas Schultz of the BSBM team advised us to increase the <code>innodb_buffer_pool_size</code> setting in the MySQL config.  We did and it produced some improvement.  Indeed, this is more like it, as we now see CPU utilization around 700% instead of the 300% in the previously published run, which rendered it suspect. Also, our experiments with TPC-D led us to expect better.  We ran these things a few times so as to have warm cache.</p>

<p>On the first run, we noticed that the Innodb warm up time was somewhere well in excess of 2000 query mixes.  Another time, we should make a graph of throughput as a function of time for both MySQL and Virtuoso.  We recently made a greedy prefetch hack that should give us some mileage there.  For the next BSBM, all we can advise is to run larger scale system for half an hour first and then measure and then measure again.  If the second measurement is the same as the first then it is good.</p>

<p>As always, since MySQL is not our specialty, we confidently invite the public to tell us how to make it run faster. So, unless something more turns up, our next trial is a revisit of <a href="http://dbpedia.org/resource/TPC-H" id="link-id0x122eaa00">TPC-H</a>.</p>]]></content:encoded>
 </rss:item>
 <rss:item xmlns:rss="http://purl.org/rss/1.0/" rdf:about="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2008-10-31#1468">
  <rss:title>Welcoming Freebase to the Linked Data Web</rss:title>
  <dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2008-10-31T15:02:00Z</dc:date>
  <dc:description xmlns:dc="http://purl.org/dc/elements/1.1/">Finally! That&#39;s all I can say re. Freebase :-) They&#39;ve now plugged their database and their community driven data curation efforts into the burgeoning Linked Data Web. Here are some examples of how we distill Entities (People, Places, Music, and other things) from Freebase (X)HTML pages (meaning: we don&#39;t have to start from RDF information resources as data sources for the eventual RDF Linked Data we generate): Barack Obama Hillary Rodham Clinton Johan McCain Tip: Install our OpenLink Data Explorer extension for Firefox. Once installed, simply browse through Freebase, and whenever you encounter a page about something of interest, simply use the following sequences to distill (via the Page Description feature) the entities from the page you are reading: CTRL-Click (Mac OS X) Right+Click (Windows &amp; Linux) Related State of the Linked Data Web Dynamic Linked Data Web Constellation</dc:description>
  <content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[Finally! That&#39;s all I can say re. Freebase :-) They&#39;ve now plugged their database and their community driven <a href="http://dbpedia.org/resource/Data">data</a> curation efforts into the burgeoning <a href="http://dbpedia.org/resource/Linked_Data" id="link-id111fe3b0">Linked Data</a> <a href="http://dbpedia.org/resource/Giant_Global_Graph" id="link-id1cd46860">Web</a>.

<p>Here are some examples of how we distill Entities (People, Places, Music, and other things) from Freebase (X)HTML pages (meaning: we don&#39;t have to start from RDF <a href="http://dbpedia.org/resource/Information" id="link-id1115cfe8">information</a> resources as data sources for the eventual RDF Linked Data we generate):</p>

<ul>
<li>
<a href="http://linkeddata.uriburner.com/about/html/http://www.freebase.com/view/en/barack_obama" id="link-id1957da00">Barack Obama</a>
</li>
<li>
<a href="http://linkeddata.uriburner.com/about/html/http://www.freebase.com/view/en/hillary_rodham_clinton" id="link-id175786d8">Hillary Rodham Clinton</a>
</li>
<li>
<a href="http://linkeddata.uriburner.com/about/html/http://www.freebase.com/view/en/john_mccain" id="link-id1c7ada58">Johan McCain</a>
</li>
</ul>

<p>Tip: Install our <a href="http://ode.openlinksw.com" id="link-id17a69a20">OpenLink Data Explorer</a> extension for Firefox. Once installed, simply browse through Freebase, and whenever you encounter a page about something of interest, simply use the following sequences to distill (via the Page Description feature) the entities from the page you are reading:</p>
<ul>
<li>
CTRL-Click (Mac OS X)
</li>
<li>
Right+Click (Windows &amp; Linux)
</li>
</ul>
<h3>Related</h3>
<ul>
<li>
  <a href="http://www.openlinksw.com/dataspace/kidehen@openlinksw.com/weblog/kidehen@openlinksw.com%27s%20BLOG%20%5B127%5D/1455" id="link-id17758840">State of the Linked Data Web</a>
</li>
<li>
  <a href="http://www.openlinksw.com/dataspace/kidehen@openlinksw.com/weblog/kidehen@openlinksw.com%27s%20BLOG%20%5B127%5D/1454" id="link-idea627e8">Dynamic Linked Data Web Constellation</a>
</li>
</ul>]]></content:encoded>
 </rss:item>
 <rss:item xmlns:rss="http://purl.org/rss/1.0/" rdf:about="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2008-10-24#1461">
  <rss:title>Virtuoso, PHP 3.5 Runtime Hosting, phpBB3, and Linked Data</rss:title>
  <dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2008-10-24T19:55:00Z</dc:date>
  <dc:description xmlns:dc="http://purl.org/dc/elements/1.1/">Runtime hosting is functionality realm of Virtuoso that is sometimes easily overlooked. In this post I want to provide a simple no-hassles HOWTO guide for installing Virtuoso on Windows (32 or 64 Bit), Mac OS X (Universal or Native 64 Bit), and Linux (32 or 64 Bit). The installation guide also covers the instantiation of phpBB3 as verification of the Virtuoso hosted PHP 3.5 runtime. What are the benefits of PHP Runtime Hosting? Simple, this means that like Apache, Virtuoso is a bona-fide Web Application Server for an PHP application. Unlike Apache, Virtuoso is also the following: a DBMS Engine (SQL, XML, RDF, and unstructured Text) that is accessible via industry standard interfaces (solely) a Virtual DBMS or Master Data Manager (MDM) for heterogeneous and distributed SQL, XML, RDF, unstructured Text based data sources an RDF Middleware solution for RDF-zation of non RDF resources across the Web and enterprise Intranets and/or Extranets (in the form of Cartridges for SOA &amp; REST Servers and RDF Views (Semantic Covers) over SQL and/or XML data sources) an RDF Linked Data Server (meaning it can deploy RDF Linked Data) As result of the above, when you deploy a PHP application using Virtuoso, you inherit the following benefits: Use of PHP-iODBC for in-process communication with Virtuoso Easy generation of RDF Linked Data from the SQL schemas of PHP applications Easy deployment of RDF Linked Data Less LAMP monoculture (*there is no such thing as virtuous monoculture*) when dealing with PHP based Web applications. As indicated in prior posts, producing RDF Linked Data from the existing Web, where a lot of content is deployed by PHP based content managers, should simply come down to RDF Views over the SQL Schemas and deployment / publishing of the RDF Views in RDF Linked data form. In a nutshell, this is what Virtuoso delivers via its PHP runtime hosting and pre packaged VADs (Virtuoso Application Distribution packages) for popular PHP based applications such as: phpBB3, Drupal, WordPress, and MediaWiki. In addition, to the RDF Linked Data deployment, we&#39;ve also taken the traditional LAMP installation tedium out of the typical PHP application deployment process. For instance, you don&#39;t have to rebuild PHP 3.5 (32 or 64 Bit) on Windows, Mac OS X, or Linux to get going, simply install Virtuoso, and then select a VAD package for the relevant application and you&#39;re set. If the application of choice isn&#39;t pre packaged by us, simply install as you would when using Apache, which comes dow to situating the PHP files in your Web structure under the Web Application&#39;s root directory. Installation Guide Download the Virtuoso installer for Windows (32 Bit msi file or 64 Bit msi file), Mac OS X (Universal Binary dmg file), or instantiate the Virtuoso EC2 AMI search for pattern: &quot;OpenLink, when using the Firefox extension or Web Interface based EC2 management consoles or look for: Â AMI ID: ami-c46084ad and Manifest Name: openlink/virtuoso-uim-unisvr-psnl/5.0/i686-fedora-linux-9.manifest.xml (32 bit edition) AMI ID:Â  ami-59628630 and Manifest Name: openlink/virtuoso-uim-unisvr-psnl/5.0/i686-fedora-linux-9.manifest.xml (64 bit edition)Â  Run the installer (or download the movies using the links in the related section below) Go to the Virtuoso Conductor (*which will show up at the end of the installation process* or go to http://localhost:8890/conductor) Go to the &quot;Admin&quot; tab within the (X)HTML based UI and select the &quot;Packages&quot; sub-menu item (a Tab) Pick phpBB3 (or any other pre-packaged PHP app) and then click on &quot;Install/Upgrase&quot; The watch one of my silent movies or read the initial startup guides for Virtuoso hosted phpBB3, Drupal, Wordpress, MediaWiki. Related At the current time, I&#39;ve only provided links to ZIP files containing the Virtuoso installation &quot;silent movies&quot;. This approach is a short-term solution to some of my current movie publishing challenges re. YouTube and Vimeo -- where the compressed output hasn&#39;t been of acceptable visual quality. Once resolved, I will publish much more &quot;Multimedia Web&quot; friendly movies :-) Windows Vista (x64) Installation Movie Mac OS X (x64 &amp; Universal binary) Installation Movie Virtuoso EC2 Cloud Edition Installation Movie</dc:description>
  <content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[
 <p>Runtime hosting is functionality realm of <a href="http://virtuoso.openlinksw.com" id="link-id1189fee8">Virtuoso</a> that is sometimes easily overlooked. In this post I want to provide a simple no-hassles HOWTO guide for installing Virtuoso on Windows (32 or 64 Bit), Mac OS X (Universal or Native 64 Bit), and Linux (32 or 64 Bit). The installation guide also covers the instantiation of <a href="http://dbpedia.org/resource/PhpBB" id="link-id118af3a8">phpBB3</a> as verification of the Virtuoso hosted <a href="http://dbpedia.org/resource/PHP" id="link-id12736b88">PHP</a> 3.5 runtime.</p>  <h3>What are the benefits of PHP Runtime Hosting?</h3>  <p>Simple, this means that like <a href="http://dbpedia.org/resource/Apache" id="link-id111ca408">Apache</a>, Virtuoso is a bona-fide <a href="http://dbpedia.org/resource/World_Wide_Web" id="link-id0xba014968">Web</a> <a href="http://dbpedia.org/resource/Application_server" id="link-id110d2aa8">Application Server</a> for an PHP application. Unlike Apache, Virtuoso is also the following:</p>  <ul> <li>a DBMS Engine (<a href="http://dbpedia.org/resource/SQL" id="link-id10f43d78">SQL</a>, XML, RDF, and unstructured Text) that is accessible via industry standard interfaces (solely)</li> <li>a Virtual DBMS or Master <a href="http://dbpedia.org/resource/Data" id="link-id0x141b0a20">Data</a> Manager (MDM) for heterogeneous and distributed SQL, XML, RDF, unstructured Text based data sources</li> <li>an <a href="http://www.openlinksw.com/weblog/public/search.vspx?blogid=127&amp;q=rdf%20middleware&amp;type=text&amp;output=html" id="link-id1116aad8">RDF Middleware</a> solution for RDF-zation of non RDF resources across the Web and enterprise Intranets and/or Extranets (in the form of Cartridges for SOA &amp; REST Servers and RDF Views (Semantic Covers) over SQL and/or XML data sources)</li> <li>an RDF <a href="http://dbpedia.org/resource/Linked_Data" id="link-id10fbe088">Linked Data</a> Server (meaning it can deploy RDF Linked Data)</li> </ul>  <p>As result of the above, when you deploy a PHP application using Virtuoso, you inherit the following benefits:</p> <ol> <li>Use of PHP-<a href="http://www.iodbc.org" id="link-id1159e070">iODBC</a> for in-process communication with Virtuoso</li> <li>Easy generation of RDF Linked Data from the SQL schemas of PHP applications</li> <li>Easy deployment of RDF Linked Data</li> <li>Less <a href="http://dbpedia.org/resource/LAMP_stack" id="link-id1179dff0">LAMP</a> monoculture (*there is no such thing as virtuous monoculture*) when dealing with PHP based Web applications. </li> </ol>  <p>As indicated in prior posts, producing RDF Linked Data from the existing Web, where a lot of content is deployed by PHP based content managers, should simply come down to RDF Views over the SQL Schemas and deployment / publishing of the RDF Views in RDF Linked data form. In a nutshell,  this is what Virtuoso delivers via its PHP runtime hosting and pre packaged VADs (Virtuoso Application Distribution packages) for popular PHP based applications such as: phpBB3, <a href="http://dbpedia.org/resource/Drupal" id="link-id111ff1c0">Drupal</a>, <a href="http://dbpedia.org/resource/WordPress" id="link-id111e26f8">WordPress</a>, and <a href="http://dbpedia.org/resource/MediaWiki" id="link-id10ea0258">MediaWiki</a>.</p>  <p>In addition, to the RDF Linked Data deployment, we&#39;ve also taken the traditional LAMP installation tedium out of the typical PHP application deployment process. For instance, you don&#39;t have to rebuild PHP 3.5 (32 or 64 Bit) on Windows, Mac OS X, or Linux to get going, simply install Virtuoso, and then select a VAD package for the relevant application and you&#39;re set. If the application of choice isn&#39;t pre packaged by us, simply install as you would when using Apache, which comes dow to situating the PHP files in your Web structure under the Web Application&#39;s root directory.</p>  <h3>Installation Guide</h3> <ol> <li>Download the Virtuoso installer for Windows (<a href="http://virtuoso-installers.s3.amazonaws.com/virt50_server_Windows_x86_32-20081022.msi" id="link-id1160cc80">32 Bit msi file</a> or <a href="http://virtuoso-installers.s3.amazonaws.com/virt50_server_Windows_x86_64-20081022.msi" id="link-id11239828">64 Bit msi file</a>), Mac OS X (<a href="http://virtuoso-installers.s3.amazonaws.com/Virtuoso-PersonalEdition-V5.0-MacOSX-10.5-Universal.dmg" id="link-id110511f8">Universal Binary dmg file</a>), or instantiate the <a href="http://www.openlinksw.com/oat/wiki/main/Main/ODSInstallationEC2" id="link-id111fe248">Virtuoso EC2 AMI</a> search for pattern: &quot;OpenLink, when using the Firefox extension or Web Interface based EC2 management consoles or look for:</li>  <ul>   <li>Â AMI ID: ami-c46084ad and Manifest Name: openlink/virtuoso-uim-unisvr-psnl/5.0/i686-fedora-linux-9.manifest.xml (32 bit edition)   </li>   <li>AMI ID:Â  ami-59628630 and Manifest Name: openlink/virtuoso-uim-unisvr-psnl/5.0/i686-fedora-linux-9.manifest.xml (64 bit edition)<br />Â    </li>  </ul> <li>Run the installer (or download the movies using the links in the related section below)</li> <li>Go to the Virtuoso Conductor (*which will show up at the end of the installation process* or go to http://localhost:8890/conductor)</li> <li>Go to the &quot;Admin&quot; tab within the (X)HTML based UI and select the &quot;Packages&quot; sub-menu item (a Tab)</li> <li>Pick phpBB3 (or any other pre-packaged PHP app) and then click on &quot;Install/Upgrase&quot;</li> <li>The watch one of my silent movies or read the initial startup guides for Virtuoso hosted phpBB3, Drupal, Wordpress, MediaWiki.</li> </ol> <h3>Related</h3> <p> At the current time, I&#39;ve only provided links to ZIP files containing the Virtuoso installation &quot;silent movies&quot;. This approach is a short-term solution to some of my current movie publishing challenges re. YouTube and Vimeo -- where the compressed output hasn&#39;t been of acceptable visual quality. Once resolved, I will publish much more &quot;Multimedia Web&quot; friendly movies :-)</p> <ul> <li>   <a href="http://my-movies.s3.amazonaws.com/Virtuoso_PHPBB3_Vista_Linked_Data_Demo.mov.zip" id="link-id11642450">Windows Vista (x64) Installation Movie</a> </li> <li>   <a href="http://my-movies.s3.amazonaws.com/Virtuoso_PHPBB3_MacOSX_Linked_Data_Demo.mov.zip" id="link-id11210498">Mac OS X (x64 &amp; Universal binary) Installation Movie</a> </li> <li>   <a href="http://my-movies.s3.amazonaws.com/Virtuoso_PHPBB3_EC2_AMI_Linked_Data_Demo.zip" id="link-id111ff268">Virtuoso EC2 Cloud Edition Installation Movie</a> </li> </ul>  
]]></content:encoded>
 </rss:item>
 <rss:item xmlns:rss="http://purl.org/rss/1.0/" rdf:about="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2008-09-05#1430">
  <rss:title>Linked Data, Ubiquity Commands, and Resource Descriptions (Update 3)</rss:title>
  <dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2008-09-05T05:43:00Z</dc:date>
  <dc:description xmlns:dc="http://purl.org/dc/elements/1.1/">Ubiquity from Mozilla Labs, provides an alternative entry point for experiencing the &quot;Controller&quot; aspect of the Web&#39;s natural compatibility with the MVC development pattern. As I&#39;ve noted (in various posts) Web Services, as practiced by the REST oriented Web 2.0 community or SOAP oriented SOA community within the enterprise, is fundamentally about the (&quot;Controller&quot; aspect of MVC. Ubiquity provides a commandline interface for direct invocation of Web Services. For instance, in our case, we can expose the Virtuoso&#39;s in-built RDF Middleware (&quot;Sponger&quot;) and Linked Data deployment services via a single command of the form: describe-resource &lt;url&gt; To experience this neat addition to Firefox you need to do the following:Download and install the Ubiquity Extension for FirefoxSubscribe to the OpenLink Command for Resource DescriptionClick on CTRL+Space (Windows / Linux) or Option+Space (Mac OS X)Type in: describe-resource &lt;a-web-resource-url&gt; How to unsubscribe At the current time, you need to do this if you&#39;ve installed commands using ubiquity 0.1.0 and seek to use newer versions of the same commands after upgrading to ubiquity 0.1.1. To unsubscribe use type &quot;about:ubiquity&quot; into browserClick on unsubscribe links associated with you command subscription list Enjoy!</dc:description>
  <content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<div><p><a href="http://labs.mozilla.com/2008/08/introducing-ubiquity/" id="link-id11258ea0">Ubiquity</a> from 
	<a href="http://labs.mozilla.com/" id="link-id112ebe28">Mozilla Labs</a>, 
	provides an alternative entry point for experiencing the "Controller" aspect of the 
	<a href="http://dbpedia.org/resource/World_Wide_Web" id="link-id0xa0d2ccd0">Web</a>'s natural compatibility with the 
	<a href="http://dbpedia.org/resource/Model-view-controller" id="link-id10ec1a08">MVC</a> development pattern. As I've noted (in <a href="http://myopenlink.net/weblog/public/search.vspx?blogid=kidehen-blog-0&amp;q=mvc&amp;type=text&amp;output=html" id="link-id15390f28">various posts</a>) <a href="http://dbpedia.org/resource/World_Wide_Web">Web</a> Services, as practiced by the REST oriented Web 2.0 community or SOAP oriented SOA community within the enterprise, is fundamentally about the ("Controller" aspect of <a href="http://dbpedia.org/resource/Model-view-controller" id="link-id13c0d758">MVC</a>. </p><p>Ubiquity provides a commandline interface for direct invocation of Web Services. For instance, in our case, we can expose the <a href="http://virtuoso.openlinksw.com" id="link-id10b04708">Virtuoso</a>'s in-built <a href="http://www.openlinksw.com/weblog/public/search.vspx?blogid=127&amp;q=rdf%20middleware&amp;type=text&amp;output=html" id="link-id1113ae38">RDF Middleware</a> ("Sponger") and <a href="http://dbpedia.org/resource/Linked_Data" id="link-id1457b3b8">Linked Data</a> deployment services via a single command of the form: describe-resource &lt;url&gt; </p><p>To experience this neat addition to Firefox you need to do the following:</p><ol><li><a href="https://people.mozilla.com/%7Eavarma/ubiquity-0.1.1.xpi" id="link-id13b15e88">Download</a> and install the Ubiquity Extension for Firefox</li><li><a href="http://demo.openlinksw.com/ubiq" id="link-id10e85880">Subscribe</a> to the OpenLink Command for Resource Description</li><li>Click on CTRL+Space (Windows / Linux) or Option+Space (Mac OS X)</li><li>Type in: describe-resource &lt;a-web-resource-url&gt;  </li></ol><h3>How to unsubscribe</h3> At the current time, you need to do this if you've installed commands using ubiquity 0.1.0 and seek to use newer versions of the same commands after upgrading to ubiquity 0.1.1.  <ol><li>To unsubscribe use type "about:ubiquity" into browser</li><li>Click on unsubscribe links associated with you command subscription list</li></ol> <p>Enjoy!</p></div>]]></content:encoded>
 </rss:item>
 <rss:item xmlns:rss="http://purl.org/rss/1.0/" rdf:about="http://www.openlinksw.com/blog/vdb/blog/?date=2008-08-06#1410">
  <rss:title>BSBM With Triples and Mapped Relational Data</rss:title>
  <dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2008-08-06T19:41:50Z</dc:date>
  <dc:description xmlns:dc="http://purl.org/dc/elements/1.1/">BSBM With Triples and Mapped Relational Data The special contribution of the Berlin SPARQL Benchmark (BSBM) to the RDF world is to raise the question of doing OLTP with RDF. Of course, here we immediately hit the question of comparisons with relational databases. To this effect, BSBM also specifies a relational schema and can generate the data as either triples or SQL inserts. The benchmark effectively simulates the case of exposing an existing RDBMS as RDF. OpenLink Software calls this RDF Views. Oracle is beginning to call this semantic covers. The RDB2RDF XG, a W3C incubator group, has been active in this area since Spring, 2008. But why an OLTP workload with RDF to begin with? We believe this is relevant because RDF promises to be the interoperability factor between potentially all of traditional IS. If data is online for human consumption, it may be online via a SPARQL end-point as well. The economic justification will come from discoverability and from applications integrating multi-source structured data. Online shopping is a fine use case. Warehousing all the world&#39;s publishable data as RDF is not our first preference, nor would it be the publisher&#39;s. Considerations of duplicate infrastructure and maintenance are reason enough. Consequently, we need to show that mapping can outperform an RDF warehouse, which is what we&#39;ll do here. What We Got First, we found that making the query plan took much too long in proportion to the run time. With BSBM this is an issue because the queries have lots of joins but access relatively little data. So we made a faster compiler and along the way retouched the cost model a bit. But the really interesting part with BSBM is mapping relational data to RDF. For us, BSBM is a great way of showing that mapping can outperform even the best triple store. A relational row store is as good as unbeatable with the query mix. And when there is a clear mapping, there is no reason the SPARQL could not be directly translated. If Chris Bizer et al launched the mapping ship, we will be the ones to pilot it to harbor! We filled two Virtuoso instances with a BSBM200000 data set, for 100M triples. One was filled with physical triples; the other was filled with the equivalent relational data plus mapping to triples. Performance figures are given in &quot;query mixes per hour&quot;. (An update or follow-on to this post will provide elapsed times for each test run.) With the unmodified benchmark we got: Physical Triples: Â  Â  1297 qmph Mapped Triples: Â  Â  3144 qmph In both cases, most of the time was spent on Q6, which looks for products with one of three words in the label. We altered Q6 to use text index for the mapping, and altered the databases accordingly. (There is no such thing as an e-commerce site without a text index, so we are amply justified in making this change.) The following were measured on the second run of a 100 query mix series, single test driver, warm cache. Physical Triples: Â  Â  5746 qmph Mapped Triples: Â  Â  7525 qmph We then ran the same with 4 concurrent instances of the test driver. The qmph here is 400 / the longest run time. Physical Triples: Â  Â  19459 qmph Mapped Triples: Â  Â  24531 qmph The system used was 64-bit Linux, 2GHz dual-Xeon 5130 (8 cores) with 8G RAM. The concurrent throughputs are a little under 4 times the single thread throughput, which is normal for SMP due to memory contention. The numbers do not evidence significant overhead from thread synchronization. The query compilation represents about 1/3 of total server side CPU. In an actual online application of this type, queries would be parameterized, so the throughputs would be accordingly higher. We used the StopCompilerWhenXOverRunTime = 1 option here to cut needless compiler overhead, the queries being straightforward enough. We also see that the advantage of mapping can be further increased by more compiler optimizations, so we expect in the end mapping will lead RDF warehousing by a factor of 4 or so. Suggestions for BSBM Reporting Rules. The benchmark spec should specify a form for disclosure of test run data, TPC style. This includes things like configuration parameters and exact text of queries. There should be accepted variants of query text, as with the TPC. Multiuser operation. The test driver should get a stream number as parameter, so that each client makes a different query sequence. Also, disk performance in this type of benchmark can only be reasonably assessed with a naturally parallel multiuser workload. Add business intelligence. SPARQL has aggregates now, at least with Jena and Virtuoso, so let&#39;s use these. The BSBM business intelligence metric should be a separate metric off the same data. Adding synthetic sales figures would make more interesting queries possible. For example, producing recommendations like &quot;customers who bought this also bought xxx.&quot; For the SPARQL community, BSBM sends the message that one ought to support parameterized queries and stored procedures. This would be a SPARQL protocol extension; the SPARUL syntax should also have a way of calling a procedure. Something like select proc (??, ??) would be enough, where ?? is a parameter marker, like ? in ODBC/JDBC. Add transactions.Especially if we are contrasting mapping vs. storing triples, having an update flow is relevant. In practice, this could be done by having the test driver send web service requests for order entry and the SUT could implement these as updates to the triples or a mapped relational store. This could use stored procedures or logic in an app server. Comments on Query Mix The time of most queries is less than linear to the scale factor. Q6 is an exception if it is not implemented using a text index. Without the text index, Q6 will inevitably come to dominate query time as the scale is increased, and thus will make the benchmark less relevant at larger scales. Next We include the sources of our RDF view definitions and other material for running BSBM with our forthcoming Virtuoso Open Source 5.0.8 release. This also includes all the query optimization work done for BSBM. This will be available in the coming days.</dc:description>
  <content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<div>
<div style="display:none;">BSBM With Triples and Mapped Relational Data</div>
<p>The special contribution of the <a href="http://www4.wiwiss.fu-berlin.de/bizer/BerlinSPARQLBenchmark/spec/index.html" id="link-id10039db0">Berlin SPARQL Benchmark</a> (<a href="http://www4.wiwiss.fu-berlin.de/bizer/BerlinSPARQLBenchmark/spec/index.html" id="link-id106b2538">BSBM</a>) to the <a href="http://dbpedia.org/resource/Resource_Description_Framework" id="link-id101a75f8">RDF</a> world is to raise the question of doing OLTP with <a href="http://dbpedia.org/resource/Resource_Description_Framework" id="link-id0xae54170">RDF</a>.</p>

<p>Of course, here we immediately hit the question of comparisons with relational databases.  To this effect, <a href="http://www4.wiwiss.fu-berlin.de/bizer/BerlinSPARQLBenchmark/spec/index.html" id="link-id0x1e847b08">BSBM</a> also specifies a relational schema and can generate the <a href="http://dbpedia.org/resource/Data" id="link-id1206c378">data</a> as either triples or <a href="http://dbpedia.org/resource/SQL" id="link-id1667f040">SQL</a> inserts.</p>

<p>The benchmark effectively simulates the case of exposing an existing <a href="http://dbpedia.org/resource/Relational_database_management_system" id="link-id10a93518">RDBMS</a> as RDF.  <a href="http://www.openlinksw.com/dataspace/organization/openlink#this" id="link-id13e46d80">OpenLink Software</a> calls this <i>RDF Views</i>.  <a href="http://dbpedia.org/resource/Oracle_Database" id="link-id12027578">Oracle</a> is beginning to call this <i>semantic covers</i>.  The <a href="http://www.w3.org/2005/Incubator/rdb2rdf/" id="link-id161dc678">RDB2RDF XG</a>, a W3C incubator group, has been active in this area since Spring, 2008.</p>

<h3>But why an OLTP workload with RDF to begin with?</h3>

<p>We believe this is relevant because RDF promises to be the interoperability factor between potentially all of traditional IS.  If <a href="http://dbpedia.org/resource/Data" id="link-id0x1e7119d8">data</a> is online for human consumption, it may be online via a <a href="http://dbpedia.org/resource/SPARQL" id="link-id106a8908">SPARQL</a> end-point as well.  The economic justification will come from discoverability and from applications integrating multi-source structured data.  Online shopping is a fine use case.</p>

<p>Warehousing all the world&#39;s publishable data as RDF is not our first preference, nor would it be the publisher&#39;s.  Considerations of duplicate infrastructure and maintenance are reason enough.  Consequently, we need to show that mapping can outperform an RDF warehouse, which is what we&#39;ll do here.</p>

<h3>What We Got </h3>

<p>First, we found that <a href="http://www.openlinksw.com/dataspace/oerling/weblog/Orri%20Erling%27s%20Blog/1400" id="link-id150ea748">making the query plan took much too long</a> in proportion to the run time.  With BSBM this is an issue because the queries have lots of joins but access relatively little data.  So we made a faster compiler and along the way retouched the cost model a bit.</p>

<p>But the really interesting part with BSBM is mapping relational data to RDF.  For us, BSBM is a great way of showing that mapping can outperform even the best triple store.  A relational row store is as good as unbeatable with the query mix.  And when there is a clear mapping, there is no reason the <a href="http://dbpedia.org/resource/SPARQL" id="link-id0xae5aff0">SPARQL</a> could not be directly translated.</p>

<p>If Chris Bizer et al launched the mapping ship, we will be the ones to pilot it to harbor!</p>

<p>We filled two <a href="http://virtuoso.openlinksw.com" id="link-id12dbdc70">Virtuoso</a> instances with a BSBM200000 data set, for 100M triples.  One was filled with physical triples; the other was filled with the equivalent relational data plus mapping to triples.  Performance figures are given in &quot;query mixes per hour&quot;.  (An update or follow-on to this post will provide elapsed times for each test run.)</p>

<p>With the unmodified benchmark we got:</p>
<blockquote>
<table>
<tr>
   <td><i>Physical Triples:</i>
   </td>
    <td>Â  Â </td>
    <td>1297 qmph</td>
  </tr>
<tr>
   <td><i>Mapped Triples:</i>
   </td>
    <td>Â  Â </td>
   <td><b>3144 qmph</b>
   </td>
  </tr>
</table>
</blockquote>
<p>In both cases, most of the time was spent on Q6, which looks for products with one of three words in the label.  We altered Q6  to use text index for the mapping, and altered the databases accordingly. (There is no such thing as an e-commerce site without a text index, so we are amply justified in making this change.)</p>

<p>The following were measured on the second run of a 100 query mix series, single test driver, warm cache.</p>
<blockquote>
<table>
<tr>
   <td><i>Physical Triples:</i>
   </td>
    <td>Â  Â </td>
    <td> 5746 qmph</td>
  </tr>
<tr>
   <td><i>Mapped Triples:</i>
   </td>
    <td>Â  Â </td>
   <td> <b>7525 qmph</b>
   </td>
  </tr>
</table>
</blockquote>
<p>We then ran the same with 4 concurrent instances of the test driver. The qmph here is 400 / the longest run time.</p>
<blockquote>
<table>
<tr>
   <td><i>Physical Triples:</i>
   </td>
    <td>Â  Â </td>
    <td> 19459 qmph</td>
  </tr>
<tr>
   <td><i>Mapped Triples:</i>
   </td>
    <td>Â  Â </td>
   <td> <b>24531 qmph</b>
   </td>
  </tr>
</table>
</blockquote>

<p>The system used was 64-bit Linux, 2GHz dual-Xeon 5130 (8 cores) with 8G RAM.  The concurrent throughputs are a little under 4 times the single thread throughput, which is normal for SMP due to memory contention.  The numbers do not evidence significant overhead from thread synchronization.</p>

<p>The query compilation represents about 1/3 of total server side CPU. In an actual online application of this type, queries would be parameterized, so the throughputs would be accordingly higher.  We used the <code>StopCompilerWhenXOverRunTime = 1</code> option here to cut needless compiler overhead, the queries being straightforward enough.</p>

<p>We also see that the advantage of mapping can be further increased by more compiler optimizations, so we expect in the end mapping will lead RDF warehousing by a factor of 4 or so.</p>

<h3>Suggestions for BSBM</h3>

<ul>
 <li>
  <p>
    <b>Reporting Rules.</b> The benchmark spec should specify a form for disclosure of test run data, TPC style.  This includes things like configuration parameters and exact text of queries.  There should be accepted variants of query text, as with the TPC.</p>
 </li>

<li>
  <p>
    <b>Multiuser operation.</b>  The test driver should get a stream number as parameter, so that each client makes a different query sequence. Also, disk performance in this type of benchmark can only be reasonably assessed with a naturally parallel multiuser workload.</p>
</li>

<li>
  <p>
    <b>Add business intelligence.</b>  SPARQL has aggregates now, at least with <a href="http://jena.sourceforge.net/" id="link-id11a25ac0">Jena</a> and <a href="http://virtuoso.openlinksw.com" id="link-id0xb003180">Virtuoso</a>, so let&#39;s use these.  The BSBM business intelligence metric should be a separate metric off the same data.  Adding synthetic sales figures would make more interesting queries possible.  For example, producing recommendations like &quot;customers who bought this also bought xxx.&quot;</p>
</li>

<li>
  <p>
    <b>For the SPARQL community</b>, BSBM sends the message that one ought to support parameterized queries and stored procedures.  This would be a <a href="http://www.w3.org/TR/rdf-sparql-protocol/" id="link-id109e2448">SPARQL protocol</a> extension; the SPARUL syntax should also have a way of calling a procedure.  Something like <code>select proc (??, ??)</code> would be enough, where <code>??</code> is a parameter marker, like <code>?</code> in <a href="http://dbpedia.org/resource/Open_Database_Connectivity" id="link-id13febf48">ODBC</a>/<a href="http://dbpedia.org/resource/Java_Database_Connectivity" id="link-id120416a8">JDBC</a>.</p>
</li>

<li>
  <p>
    <b>Add transactions.</b>Especially if we are contrasting mapping vs. storing triples, having an update flow is relevant.  In practice, this could be done by having the test driver send web service requests for order entry and the SUT could implement these as updates to the triples or a mapped relational store.  This could use stored procedures or logic in an app server.</p>
</li>
</ul>

<h3>Comments on Query Mix</h3>

<p>The time of most queries is less than linear to the scale factor.  Q6 is an exception if it is not implemented using a text index.  Without the text index, Q6 will inevitably come to dominate query time as the scale is increased, and thus will make the benchmark less relevant at larger scales.</p>

<h2>Next</h2>

<p>We include the sources of our RDF view definitions and other material for running BSBM with our forthcoming Virtuoso Open Source 5.0.8 release.  This also includes all the query optimization work done for BSBM.  This will be available in the coming days.</p>
</div>]]></content:encoded>
 </rss:item>
 <rss:item xmlns:rss="http://purl.org/rss/1.0/" rdf:about="http://www.openlinksw.com/weblog/oerling/?date=2008-08-06#1409">
  <rss:title>BSBM With Triples and Mapped Relational Data</rss:title>
  <dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2008-08-06T19:35:27Z</dc:date>
  <dc:description xmlns:dc="http://purl.org/dc/elements/1.1/">The special contribution of the Berlin SPARQL Benchmark (BSBM) to the RDF world is to raise the question of doing OLTP with RDF. Of course, here we immediately hit the question of comparisons with relational databases. To this effect, BSBM also specifies a relational schema and can generate the data as either triples or SQL inserts. The benchmark effectively simulates the case of exposing an existing RDBMS as RDF. OpenLink Software calls this RDF Views. Oracle is beginning to call this semantic covers. The RDB2RDF XG, a W3C incubator group, has been active in this area since Spring, 2008. But why an OLTP workload with RDF to begin with? We believe this is relevant because RDF promises to be the interoperability factor between potentially all of traditional IS. If data is online for human consumption, it may be online via a SPARQL end-point as well. The economic justification will come from discoverability and from applications integrating multi-source structured data. Online shopping is a fine use case. Warehousing all the world&#39;s publishable data as RDF is not our first preference, nor would it be the publisher&#39;s. Considerations of duplicate infrastructure and maintenance are reason enough. Consequently, we need to show that mapping can outperform an RDF warehouse, which is what we&#39;ll do here. What We Got First, we found that making the query plan took much too long in proportion to the run time. With BSBM this is an issue because the queries have lots of joins but access relatively little data. So we made a faster compiler and along the way retouched the cost model a bit. But the really interesting part with BSBM is mapping relational data to RDF. For us, BSBM is a great way of showing that mapping can outperform even the best triple store. A relational row store is as good as unbeatable with the query mix. And when there is a clear mapping, there is no reason the SPARQL could not be directly translated. If Chris Bizer et al launched the mapping ship, we will be the ones to pilot it to harbor! We filled two Virtuoso instances with a BSBM200000 data set, for 100M triples. One was filled with physical triples; the other was filled with the equivalent relational data plus mapping to triples. Performance figures are given in &quot;query mixes per hour&quot;. (An update or follow-on to this post will provide elapsed times for each test run.) With the unmodified benchmark we got: Physical Triples: Â  Â  1297 qmph Mapped Triples: Â  Â  3144 qmph In both cases, most of the time was spent on Q6, which looks for products with one of three words in the label. We altered Q6 to use text index for the mapping, and altered the databases accordingly. (There is no such thing as an e-commerce site without a text index, so we are amply justified in making this change.) The following were measured on the second run of a 100 query mix series, single test driver, warm cache. Physical Triples: Â  Â  5746 qmph Mapped Triples: Â  Â  7525 qmph We then ran the same with 4 concurrent instances of the test driver. The qmph here is 400 / the longest run time. Physical Triples: Â  Â  19459 qmph Mapped Triples: Â  Â  24531 qmph The system used was 64-bit Linux, 2GHz dual-Xeon 5130 (8 cores) with 8G RAM. The concurrent throughputs are a little under 4 times the single thread throughput, which is normal for SMP due to memory contention. The numbers do not evidence significant overhead from thread synchronization. The query compilation represents about 1/3 of total server side CPU. In an actual online application of this type, queries would be parameterized, so the throughputs would be accordingly higher. We used the StopCompilerWhenXOverRunTime = 1 option here to cut needless compiler overhead, the queries being straightforward enough. We also see that the advantage of mapping can be further increased by more compiler optimizations, so we expect in the end mapping will lead RDF warehousing by a factor of 4 or so. Suggestions for BSBM Reporting Rules. The benchmark spec should specify a form for disclosure of test run data, TPC style. This includes things like configuration parameters and exact text of queries. There should be accepted variants of query text, as with the TPC. Multiuser operation. The test driver should get a stream number as parameter, so that each client makes a different query sequence. Also, disk performance in this type of benchmark can only be reasonably assessed with a naturally parallel multiuser workload. Add business intelligence. SPARQL has aggregates now, at least with Jena and Virtuoso, so let&#39;s use these. The BSBM business intelligence metric should be a separate metric off the same data. Adding synthetic sales figures would make more interesting queries possible. For example, producing recommendations like &quot;customers who bought this also bought xxx.&quot; For the SPARQL community, BSBM sends the message that one ought to support parameterized queries and stored procedures. This would be a SPARQL protocol extension; the SPARUL syntax should also have a way of calling a procedure. Something like select proc (??, ??) would be enough, where ?? is a parameter marker, like ? in ODBC/JDBC. Add transactions.Especially if we are contrasting mapping vs. storing triples, having an update flow is relevant. In practice, this could be done by having the test driver send web service requests for order entry and the SUT could implement these as updates to the triples or a mapped relational store. This could use stored procedures or logic in an app server. Comments on Query Mix The time of most queries is less than linear to the scale factor. Q6 is an exception if it is not implemented using a text index. Without the text index, Q6 will inevitably come to dominate query time as the scale is increased, and thus will make the benchmark less relevant at larger scales. Next We include the sources of our RDF view definitions and other material for running BSBM with our forthcoming Virtuoso Open Source 5.0.8 release. This also includes all the query optimization work done for BSBM. This will be available in the coming days.</dc:description>
  <content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<p>The special contribution of the <a href="http://www4.wiwiss.fu-berlin.de/bizer/BerlinSPARQLBenchmark/spec/index.html" id="link-id10039db0">Berlin SPARQL Benchmark</a> (<a href="http://www4.wiwiss.fu-berlin.de/bizer/BerlinSPARQLBenchmark/spec/index.html" id="link-id106b2538">BSBM</a>) to the <a href="http://dbpedia.org/resource/Resource_Description_Framework" id="link-id101a75f8">RDF</a> world is to raise the question of doing OLTP with <a href="http://dbpedia.org/resource/Resource_Description_Framework" id="link-id0xb230eb0">RDF</a>.</p>

<p>Of course, here we immediately hit the question of comparisons with relational databases.  To this effect, <a href="http://www4.wiwiss.fu-berlin.de/bizer/BerlinSPARQLBenchmark/spec/index.html" id="link-id0xa832da8">BSBM</a> also specifies a relational schema and can generate the <a href="http://dbpedia.org/resource/Data" id="link-id1206c378">data</a> as either triples or <a href="http://dbpedia.org/resource/SQL" id="link-id1667f040">SQL</a> inserts.</p>

<p>The benchmark effectively simulates the case of exposing an existing <a href="http://dbpedia.org/resource/Relational_database_management_system" id="link-id10a93518">RDBMS</a> as RDF.  <a href="http://www.openlinksw.com/dataspace/organization/openlink#this" id="link-id13e46d80">OpenLink Software</a> calls this <i>RDF Views</i>.  <a href="http://dbpedia.org/resource/Oracle_Database" id="link-id12027578">Oracle</a> is beginning to call this <i>semantic covers</i>.  The <a href="http://www.w3.org/2005/Incubator/rdb2rdf/" id="link-id161dc678">RDB2RDF XG</a>, a W3C incubator group, has been active in this area since Spring, 2008.</p>

<h3>But why an OLTP workload with RDF to begin with?</h3>

<p>We believe this is relevant because RDF promises to be the interoperability factor between potentially all of traditional IS.  If <a href="http://dbpedia.org/resource/Data" id="link-id0xabe48a0">data</a> is online for human consumption, it may be online via a <a href="http://dbpedia.org/resource/SPARQL" id="link-id106a8908">SPARQL</a> end-point as well.  The economic justification will come from discoverability and from applications integrating multi-source structured data.  Online shopping is a fine use case.</p>

<p>Warehousing all the world&#39;s publishable data as RDF is not our first preference, nor would it be the publisher&#39;s.  Considerations of duplicate infrastructure and maintenance are reason enough.  Consequently, we need to show that mapping can outperform an RDF warehouse, which is what we&#39;ll do here.</p>

<h3>What We Got </h3>

<p>First, we found that <a href="http://www.openlinksw.com/dataspace/oerling/weblog/Orri%20Erling%27s%20Blog/1400" id="link-id150ea748">making the query plan took much too long</a> in proportion to the run time.  With BSBM this is an issue because the queries have lots of joins but access relatively little data.  So we made a faster compiler and along the way retouched the cost model a bit.</p>

<p>But the really interesting part with BSBM is mapping relational data to RDF.  For us, BSBM is a great way of showing that mapping can outperform even the best triple store.  A relational row store is as good as unbeatable with the query mix.  And when there is a clear mapping, there is no reason the <a href="http://dbpedia.org/resource/SPARQL" id="link-id0x96bb5e0">SPARQL</a> could not be directly translated.</p>

<p>If Chris Bizer et al launched the mapping ship, we will be the ones to pilot it to harbor!</p>

<p>We filled two <a href="http://virtuoso.openlinksw.com" id="link-id12dbdc70">Virtuoso</a> instances with a BSBM200000 data set, for 100M triples.  One was filled with physical triples; the other was filled with the equivalent relational data plus mapping to triples.  Performance figures are given in &quot;query mixes per hour&quot;.  (An update or follow-on to this post will provide elapsed times for each test run.)</p>

<p>With the unmodified benchmark we got:</p>
<blockquote>
<table>
<tr>
   <td><i>Physical Triples:</i>
   </td>
    <td>Â  Â </td>
    <td>1297 qmph</td>
  </tr>
<tr>
   <td><i>Mapped Triples:</i>
   </td>
    <td>Â  Â </td>
   <td><b>3144 qmph</b>
   </td>
  </tr>
</table>
</blockquote>
<p>In both cases, most of the time was spent on Q6, which looks for products with one of three words in the label.  We altered Q6  to use text index for the mapping, and altered the databases accordingly. (There is no such thing as an e-commerce site without a text index, so we are amply justified in making this change.)</p>

<p>The following were measured on the second run of a 100 query mix series, single test driver, warm cache.</p>
<blockquote>
<table>
<tr>
   <td><i>Physical Triples:</i>
   </td>
    <td>Â  Â </td>
    <td> 5746 qmph</td>
  </tr>
<tr>
   <td><i>Mapped Triples:</i>
   </td>
    <td>Â  Â </td>
   <td> <b>7525 qmph</b>
   </td>
  </tr>
</table>
</blockquote>
<p>We then ran the same with 4 concurrent instances of the test driver. The qmph here is 400 / the longest run time.</p>
<blockquote>
<table>
<tr>
   <td><i>Physical Triples:</i>
   </td>
    <td>Â  Â </td>
    <td> 19459 qmph</td>
  </tr>
<tr>
   <td><i>Mapped Triples:</i>
   </td>
    <td>Â  Â </td>
   <td> <b>24531 qmph</b>
   </td>
  </tr>
</table>
</blockquote>

<p>The system used was 64-bit Linux, 2GHz dual-Xeon 5130 (8 cores) with 8G RAM.  The concurrent throughputs are a little under 4 times the single thread throughput, which is normal for SMP due to memory contention.  The numbers do not evidence significant overhead from thread synchronization.</p>

<p>The query compilation represents about 1/3 of total server side CPU. In an actual online application of this type, queries would be parameterized, so the throughputs would be accordingly higher.  We used the <code>StopCompilerWhenXOverRunTime = 1</code> option here to cut needless compiler overhead, the queries being straightforward enough.</p>

<p>We also see that the advantage of mapping can be further increased by more compiler optimizations, so we expect in the end mapping will lead RDF warehousing by a factor of 4 or so.</p>

<h3>Suggestions for BSBM</h3>

<ul>
 <li>
  <p>
    <b>Reporting Rules.</b> The benchmark spec should specify a form for disclosure of test run data, TPC style.  This includes things like configuration parameters and exact text of queries.  There should be accepted variants of query text, as with the TPC.</p>
 </li>

<li>
  <p>
    <b>Multiuser operation.</b>  The test driver should get a stream number as parameter, so that each client makes a different query sequence. Also, disk performance in this type of benchmark can only be reasonably assessed with a naturally parallel multiuser workload.</p>
</li>

<li>
  <p>
    <b>Add business intelligence.</b>  SPARQL has aggregates now, at least with <a href="http://jena.sourceforge.net/" id="link-id11a25ac0">Jena</a> and <a href="http://virtuoso.openlinksw.com" id="link-id0xa83f490">Virtuoso</a>, so let&#39;s use these.  The BSBM business intelligence metric should be a separate metric off the same data.  Adding synthetic sales figures would make more interesting queries possible.  For example, producing recommendations like &quot;customers who bought this also bought xxx.&quot;</p>
</li>

<li>
  <p>
    <b>For the SPARQL community</b>, BSBM sends the message that one ought to support parameterized queries and stored procedures.  This would be a <a href="http://www.w3.org/TR/rdf-sparql-protocol/" id="link-id109e2448">SPARQL protocol</a> extension; the SPARUL syntax should also have a way of calling a procedure.  Something like <code>select proc (??, ??)</code> would be enough, where <code>??</code> is a parameter marker, like <code>?</code> in <a href="http://dbpedia.org/resource/Open_Database_Connectivity" id="link-id13febf48">ODBC</a>/<a href="http://dbpedia.org/resource/Java_Database_Connectivity" id="link-id120416a8">JDBC</a>.</p>
</li>

<li>
  <p>
    <b>Add transactions.</b>Especially if we are contrasting mapping vs. storing triples, having an update flow is relevant.  In practice, this could be done by having the test driver send web service requests for order entry and the SUT could implement these as updates to the triples or a mapped relational store.  This could use stored procedures or logic in an app server.</p>
</li>
</ul>

<h3>Comments on Query Mix</h3>

<p>The time of most queries is less than linear to the scale factor.  Q6 is an exception if it is not implemented using a text index.  Without the text index, Q6 will inevitably come to dominate query time as the scale is increased, and thus will make the benchmark less relevant at larger scales.</p>

<h2>Next</h2>

<p>We include the sources of our RDF view definitions and other material for running BSBM with our forthcoming Virtuoso Open Source 5.0.8 release.  This also includes all the query optimization work done for BSBM.  This will be available in the coming days.</p>]]></content:encoded>
 </rss:item>
 <rss:item xmlns:rss="http://purl.org/rss/1.0/" rdf:about="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2008-08-03#1408">
  <rss:title>.NET, LINQ, and RDF based Linked Data (Update 2)</rss:title>
  <dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2008-08-03T16:07:09Z</dc:date>
  <dc:description xmlns:dc="http://purl.org/dc/elements/1.1/">At OpenLink, we&#39;ve been investigating LinqToRdf, an exciting project from Andrew Matthews that seeks to expose the Semantic Web technology space to the large community of .NET developers. The LinqToRdf project is about binding LINQ to RDF. It sits atop Joshua Tauberer&#39;s C# based Semantic Web/RDF library which has been out there for a while and works across Microsoft .NET and it&#39;s open source variant &quot;Mono&quot;. Historically, the Semantic Web realm has been dominated by RDF frameworks such as Sesame, Jena and Redland; which by their Open Source orientation, predominantly favor non-Windows platforms (Java and Linux). Conversely, Microsoft&#39;s .NET frameworks have sought to offer Conceptualization technology for heterogeneous Logical Data Sources via .NET&#39;s Entity Frameworks and ADO.NET, but without any actual bindings to RDF. Interestingly, believe it or not, .NET already has a data query language that shares a number of similarities with SPARQL, called Entity-SQL, and a very innovative programming language called LINQ; that offers a blend of constructs for natural data access and manipulation across relational (SQL), hierarchical (XML), and graph (Object) models without the traditional object language-&gt;database impedance tensions of the past. With regards to all of the above, we&#39;ve just released a mini white paper that covers the exploitation of RDF-based Linked Data using .NET via LINQ. The paper offers a an overview of LinqToRdf, plus enhancements we&#39;ve contributed to the project (available in LinqToRdf v0.8.). The paper includes real-world examples that tap into a MusicBrainz powered Linked Data Space, the Music Ontology, the Virtuoso RDF Quad Store, Virtuoso Sponger Middleware, and our RDfization Cartridges for Musicbrainz. Enjoy!</dc:description>
  <content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<p>At OpenLink, we&#39;ve been investigating <a href="http://code.google.com/p/linqtordf/" id="link-id1296eb18">LinqToRdf</a>, an exciting project from <a href="http://aabs.wordpress.com/" id="link-id13e860a8">Andrew Matthews</a> that seeks to expose the <a href="http://dbpedia.org/resource/Semantic_Web" id="link-id105d84f8">Semantic Web</a> technology space to the large community of .NET developers. </p>
<p>The LinqToRdf project is about binding LINQ to RDF. It sits atop <a href="http://razor.occams.info/" id="link-id102e3b10">Joshua Tauberer</a>&#39;s <a href="http://dbpedia.org/resource/C_(programming_language)" id="link-id1471b0d0">C</a># based <a href="http://razor.occams.info/code/semweb/" id="link-id14cb9030">Semantic Web/RDF library</a> which has been out there for a while and works across Microsoft .NET and it&#39;s open source variant &quot;Mono&quot;.</p>

<p>Historically, the <a href="http://dbpedia.org/resource/Semantic_Web" id="link-id13ee9f40">Semantic Web</a> realm has been dominated by RDF
frameworks  such as <a href="http://www.openrdf.org/" id="link-id109f8a68">Sesame</a>, <a href="http://jena.sourceforge.net/" id="link-id144c3210">Jena</a> and <a href="http://librdf.org/" id="link-id10600228">Redland</a>; which by their Open
Source orientation, predominantly favor non-Windows platforms (Java and
Linux). Conversely, Microsoft&#39;s .NET frameworks have sought to offer
Conceptualization technology for heterogeneous Logical <a href="http://dbpedia.org/resource/Data">Data</a> Sources via
.NET&#39;s <a href="http://en.wikipedia.org/wiki/ADO.NET_Entity_Framework" id="link-id10726628">Entity Frameworks</a> and <a href="http://dbpedia.org/resource/ADO.NET" id="link-id13e7edd8">ADO.NET</a>, but without any actual bindings
to RDF. </p>
<p>Interestingly, believe it or not, .NET already has a data query
language that shares a number of similarities with <a href="http://dbpedia.org/resource/SPARQL" id="link-id1042f480">SPARQL</a>, called
<a href="http://dbpedia.org/resource/Entity" id="link-id105a46b0">Entity</a>-<a href="http://dbpedia.org/resource/SQL" id="link-id1041d2e8">SQL</a>, and a very innovative programming language called LINQ;
that offers a blend of constructs for natural data access and
manipulation across relational (<a href="http://dbpedia.org/resource/SQL" id="link-id139f5848">SQL</a>), hierarchical (XML), and graph
(Object) models without the traditional object language-&gt;database
impedance tensions of the past.</p>

<p>With regards to all of the above, we&#39;ve just released a mini white paper that covers the exploitation of <a href="http://virtuoso.openlinksw.com/Whitepapers/html/linqtordf/linqtordf1.htm" id="link-id14b2f138">RDF-based Linked Data using .NET via LINQ</a>. The paper offers a an overview of LinqToRdf, plus enhancements we&#39;ve contributed to the project (available in  <a href="http://aabs.wordpress.com/2008/08/01/announcing-linqtordf-v08/" id="link-id101defa8">LinqToRdf v0.8</a>.).
The paper includes real-world examples that tap into a MusicBrainz
powered <a href="http://dbpedia.org/resource/Linked_Data" id="link-id101ffd18">Linked Data</a> <a href="http://en.wikipedia.org/wiki/Data_Spaces" id="link-id105cb858">Space</a>, the Music Ontology, the <a href="http://virtuoso.openlinksw.com" id="link-id13f55860">Virtuoso</a> RDF Quad
Store, <a href="http://virtuoso.openlinksw.com" id="link-id12826718">Virtuoso</a> <a href="http://virtuoso.openlinksw.com/Whitepapers/html/VirtSpongerWhitePaper.html" id="link-id1030cb60">Sponger</a> Middleware, and our RDfization Cartridges for
Musicbrainz. </p>
Enjoy!]]></content:encoded>
 </rss:item>
 <rss:item xmlns:rss="http://purl.org/rss/1.0/" rdf:about="http://www.openlinksw.com/blog/vdb/blog/?date=2008-07-30#1401">
  <rss:title>Virtuoso Optimizations for the Berlin SPARQL Benchmark </rss:title>
  <dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2008-07-30T18:52:11Z</dc:date>
  <dc:description xmlns:dc="http://purl.org/dc/elements/1.1/">Virtuoso Optimizations for the Berlin SPARQL Benchmark We had a look at Chris Bizer&#39;s initial results with the Berlin SPARQL Benchmark (BSBM) on Virtuoso. The first results were rather bad, as nearly all of the run time was spent optimizing the SPARQL statements and under 10% actually running them. So I spent a couple of days on the SPARQL/SQL compiler, to the effect of making it do a better guess of initial execution plan and streamlining some operations. In fact, many of the queries in BSBM are not particularly sensitive to execution plan, as they access a very small portion of the database. So to close the matter, I put in a flag that makes the SQL compiler give up on devising new plans if the time of the best plan so far is less than the time spent compiling so far. With these changes, available now as a diff on top of 5.0.7, we run quite well, several times better than initially. With the compiler time cut-off in place (ini parameter StopCompilerWhenXOverRunTime = 1), we get the following times, output from the BSBM test driver: Starting test... 0: 1031.22 ms, total: 1151 ms 1: 982.89 ms, total: 1040 ms 2: 923.27 ms, total: 968 ms 3: 898.37 ms, total: 932 ms 4: 855.70 ms, total: 865 ms Scale factor: 10000 Number of query mix runs: 5 times min/max Query mix runtime: 0.8557 s / 1.0312 s Total runtime: 4.691 seconds QMpH: 3836.77 query mixes per hour CQET: 0.93829 seconds average runtime of query mix CQET (geom.): 0.93625 seconds geometric mean runtime of query mix Metrics for Query 1: Count: 5 times executed in whole run AQET: 0.012212 seconds (arithmetic mean) AQET(geom.): 0.009934 seconds (geometric mean) QPS: 81.89 Queries per second minQET/maxQET: 0.00684000s / 0.03115700s Average result count: 7.0 min/max result count: 3 / 10 Metrics for Query 2: Count: 35 times executed in whole run AQET: 0.030490 seconds (arithmetic mean) AQET(geom.): 0.029776 seconds (geometric mean) QPS: 32.80 Queries per second minQET/maxQET: 0.02467300s / 0.06753000s Average result count: 22.5 min/max result count: 15 / 30 Metrics for Query 3: Count: 5 times executed in whole run AQET: 0.006947 seconds (arithmetic mean) AQET(geom.): 0.006905 seconds (geometric mean) QPS: 143.95 Queries per second minQET/maxQET: 0.00580000s / 0.00795100s Average result count: 4.0 min/max result count: 0 / 10 Metrics for Query 4: Count: 5 times executed in whole run AQET: 0.008858 seconds (arithmetic mean) AQET(geom.): 0.008829 seconds (geometric mean) QPS: 112.89 Queries per second minQET/maxQET: 0.00804400s / 0.01019500s Average result count: 3.4 min/max result count: 0 / 10 Metrics for Query 5: Count: 5 times executed in whole run AQET: 0.087542 seconds (arithmetic mean) AQET(geom.): 0.087327 seconds (geometric mean) QPS: 11.42 Queries per second minQET/maxQET: 0.08165600s / 0.09889200s Average result count: 5.0 min/max result count: 5 / 5 Metrics for Query 6: Count: 5 times executed in whole run AQET: 0.131222 seconds (arithmetic mean) AQET(geom.): 0.131216 seconds (geometric mean) QPS: 7.62 Queries per second minQET/maxQET: 0.12924200s / 0.13298200s Average result count: 3.6 min/max result count: 3 / 5 Metrics for Query 7: Count: 20 times executed in whole run AQET: 0.043601 seconds (arithmetic mean) AQET(geom.): 0.040890 seconds (geometric mean) QPS: 22.94 Queries per second minQET/maxQET: 0.01984400s / 0.06012600s Average result count: 26.4 min/max result count: 5 / 96 Metrics for Query 8: Count: 10 times executed in whole run AQET: 0.018168 seconds (arithmetic mean) AQET(geom.): 0.016205 seconds (geometric mean) QPS: 55.04 Queries per second minQET/maxQET: 0.01097600s / 0.05066900s Average result count: 12.8 min/max result count: 6 / 20 Metrics for Query 9: Count: 20 times executed in whole run AQET: 0.043813 seconds (arithmetic mean) AQET(geom.): 0.043807 seconds (geometric mean) QPS: 22.82 Queries per second minQET/maxQET: 0.04274900s / 0.04504100s Average result count: 0.0 min/max result count: 0 / 0 Metrics for Query 10: Count: 15 times executed in whole run AQET: 0.030697 seconds (arithmetic mean) AQET(geom.): 0.029651 seconds (geometric mean) QPS: 32.58 Queries per second minQET/maxQET: 0.02072000s / 0.03975700s Average result count: 1.1 min/max result count: 0 / 4 real 0 m 5.485 s user 0 m 2.233 s sys 0 m 0.170 s Of the approximately 5.5 seconds of running five query mixes, the test driver spends 2.2 s. The server side processing time is 3.1 s, of which SQL compilation is 1.35 s. The rest is miscellaneous system time. The measurement is on 64-bit Linux, 2GHz dual-Xeon 5130 (8 cores) with 8G RAM. We note that this type of workload would be done with stored procedures or prepared, parameterized queries in the SQL world. There will be some further tuning still but this addresses the bulk of the matter. There will be a separate message about the patch containing these improvements.</dc:description>
  <content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<div>
<div style="display:none;">Virtuoso Optimizations for the Berlin SPARQL Benchmark </div>
<p>We had a look at Chris Bizer&#39;s initial results with the <a href="http://www4.wiwiss.fu-berlin.de/bizer/BerlinSPARQLBenchmark/spec/index.html" id="link-id105c9f78">Berlin SPARQL Benchmark</a> (<a href="http://www4.wiwiss.fu-berlin.de/bizer/BerlinSPARQLBenchmark/spec/index.html" id="link-id102d62b0">BSBM</a>) on <a href="http://virtuoso.openlinksw.com" id="link-id13eb9780">Virtuoso</a>.  The first results were rather bad, as nearly all of the run time was spent optimizing the <a href="http://dbpedia.org/resource/SPARQL" id="link-id14a51258">SPARQL</a> statements and under 10% actually running them.</p>
<p>So I spent a couple of days on the <a href="http://dbpedia.org/resource/SPARQL" id="link-id0xaad28d0">SPARQL</a>/<a href="http://dbpedia.org/resource/SQL" id="link-id108745b0">SQL</a> compiler, to the effect of making it do a better guess of initial execution plan and streamlining some operations.  In fact, many of the queries in <a href="http://www4.wiwiss.fu-berlin.de/bizer/BerlinSPARQLBenchmark/spec/index.html" id="link-id0xaa230b8">BSBM</a> are not particularly sensitive to execution plan, as they access a very small portion of the database.  So to close the matter, I put in a flag that makes the <a href="http://dbpedia.org/resource/SQL" id="link-id0x1e9e8e28">SQL</a> compiler give up on devising new plans if the time of the best plan so far is less than the time spent compiling so far.</p>
<p>With these changes, available now as a diff on top of 5.0.7, we run quite well, several times better than initially.  With the compiler time cut-off in place (ini parameter <code>StopCompilerWhenXOverRunTime = 1</code>), we get the following times, output from the BSBM test driver:</p>
<blockquote>
<pre>
Starting test...

0: 1031.22 ms, total: 1151 ms
1:  982.89 ms, total: 1040 ms
2:  923.27 ms, total:  968 ms
3:  898.37 ms, total:  932 ms
4:  855.70 ms, total:  865 ms

Scale factor:               10000
Number of query mix runs:   5 times
min/max Query mix runtime:  0.8557 s / 1.0312 s
Total runtime:              4.691 seconds
QMpH:                       3836.77 query mixes per hour
CQET:                       0.93829 seconds average runtime 
                                       of query mix
CQET (geom.):               0.93625 seconds geometric mean 
                                       runtime of query mix

Metrics for Query 1:
   Count:                 5 times executed in whole run
   AQET:                  0.012212 seconds (arithmetic mean)
   AQET(geom.):           0.009934 seconds (geometric mean)
   QPS:                   81.89 Queries per second
   minQET/maxQET:         0.00684000s / 0.03115700s
   Average result count:  7.0
   min/max result count:  3 / 10

Metrics for Query 2:
   Count:                 35 times executed in whole run
   AQET:                  0.030490 seconds (arithmetic mean)
   AQET(geom.):           0.029776 seconds (geometric mean)
   QPS:                   32.80 Queries per second
   minQET/maxQET:         0.02467300s / 0.06753000s
   Average result count:  22.5
   min/max result count:  15 / 30

Metrics for Query 3:
   Count:                 5 times executed in whole run
   AQET:                  0.006947 seconds (arithmetic mean)
   AQET(geom.):           0.006905 seconds (geometric mean)
   QPS:                   143.95 Queries per second
   minQET/maxQET:         0.00580000s / 0.00795100s
   Average result count:  4.0
   min/max result count:  0 / 10

Metrics for Query 4:
   Count:                 5 times executed in whole run
   AQET:                  0.008858 seconds (arithmetic mean)
   AQET(geom.):           0.008829 seconds (geometric mean)
   QPS:                   112.89 Queries per second
   minQET/maxQET:         0.00804400s / 0.01019500s
   Average result count:  3.4
   min/max result count:  0 / 10

Metrics for Query 5:
   Count:                 5 times executed in whole run
   AQET:                  0.087542 seconds (arithmetic mean)
   AQET(geom.):           0.087327 seconds (geometric mean)
   QPS:                   11.42 Queries per second
   minQET/maxQET:         0.08165600s / 0.09889200s
   Average result count:  5.0
   min/max result count:  5 / 5

Metrics for Query 6:
   Count:                 5 times executed in whole run
   AQET:                  0.131222 seconds (arithmetic mean)
   AQET(geom.):           0.131216 seconds (geometric mean)
   QPS:                   7.62 Queries per second
   minQET/maxQET:         0.12924200s / 0.13298200s
   Average result count:  3.6
   min/max result count:  3 / 5

Metrics for Query 7:
   Count:                 20 times executed in whole run
   AQET:                  0.043601 seconds (arithmetic mean)
   AQET(geom.):           0.040890 seconds (geometric mean)
   QPS:                   22.94 Queries per second
   minQET/maxQET:         0.01984400s / 0.06012600s
   Average result count:  26.4
   min/max result count:  5 / 96

Metrics for Query 8:
   Count:                 10 times executed in whole run
   AQET:                  0.018168 seconds (arithmetic mean)
   AQET(geom.):           0.016205 seconds (geometric mean)
   QPS:                   55.04 Queries per second
   minQET/maxQET:         0.01097600s / 0.05066900s
   Average result count:  12.8
   min/max result count:  6 / 20

Metrics for Query 9:
   Count:                 20 times executed in whole run
   AQET:                  0.043813 seconds (arithmetic mean)
   AQET(geom.):           0.043807 seconds (geometric mean)
   QPS:                   22.82 Queries per second
   minQET/maxQET:         0.04274900s / 0.04504100s
   Average result count:  0.0
   min/max result count:  0 / 0

Metrics for Query 10:
   Count:                 15 times executed in whole run
   AQET:                  0.030697 seconds (arithmetic mean)
   AQET(geom.):           0.029651 seconds (geometric mean)
   QPS:                   32.58 Queries per second
   minQET/maxQET:         0.02072000s / 0.03975700s
   Average result count:  1.1
   min/max result count:  0 / 4

   real  0 m 5.485 s
   user  0 m 2.233 s
   sys   0 m 0.170 s
</pre></blockquote>
<p>Of the approximately 5.5 seconds of running five query mixes, the test driver spends 2.2 s.  The server side processing time is 3.1 s, of which SQL compilation is 1.35 s.  The rest is miscellaneous system time.  The measurement is on 64-bit Linux, 2GHz dual-Xeon 5130 (8 cores) with 8G RAM. </p>
<p>We note that this type of workload would be done with stored procedures or prepared, parameterized queries in the SQL world.</p>
<p>There will be some further tuning still but this addresses the bulk of the matter.  There will be a separate message about the patch containing these improvements.</p>
</div>]]></content:encoded>
 </rss:item>
 <rss:item xmlns:rss="http://purl.org/rss/1.0/" rdf:about="http://www.openlinksw.com/weblog/oerling/?date=2008-07-30#1400">
  <rss:title>Virtuoso Optimizations for the Berlin SPARQL Benchmark </rss:title>
  <dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2008-07-30T18:17:54Z</dc:date>
  <dc:description xmlns:dc="http://purl.org/dc/elements/1.1/">We had a look at Chris Bizer&#39;s initial results with the Berlin SPARQL Benchmark (BSBM) on Virtuoso. The first results were rather bad, as nearly all of the run time was spent optimizing the SPARQL statements and under 10% actually running them. So I spent a couple of days on the SPARQL/SQL compiler, to the effect of making it do a better guess of initial execution plan and streamlining some operations. In fact, many of the queries in BSBM are not particularly sensitive to execution plan, as they access a very small portion of the database. So to close the matter, I put in a flag that makes the SQL compiler give up on devising new plans if the time of the best plan so far is less than the time spent compiling so far. With these changes, available now as a diff on top of 5.0.7, we run quite well, several times better than initially. With the compiler time cut-off in place (ini parameter StopCompilerWhenXOverRunTime = 1), we get the following times, output from the BSBM test driver: Starting test... 0: 1031.22 ms, total: 1151 ms 1: 982.89 ms, total: 1040 ms 2: 923.27 ms, total: 968 ms 3: 898.37 ms, total: 932 ms 4: 855.70 ms, total: 865 ms Scale factor: 10000 Number of query mix runs: 5 times min/max Query mix runtime: 0.8557 s / 1.0312 s Total runtime: 4.691 seconds QMpH: 3836.77 query mixes per hour CQET: 0.93829 seconds average runtime of query mix CQET (geom.): 0.93625 seconds geometric mean runtime of query mix Metrics for Query 1: Count: 5 times executed in whole run AQET: 0.012212 seconds (arithmetic mean) AQET(geom.): 0.009934 seconds (geometric mean) QPS: 81.89 Queries per second minQET/maxQET: 0.00684000s / 0.03115700s Average result count: 7.0 min/max result count: 3 / 10 Metrics for Query 2: Count: 35 times executed in whole run AQET: 0.030490 seconds (arithmetic mean) AQET(geom.): 0.029776 seconds (geometric mean) QPS: 32.80 Queries per second minQET/maxQET: 0.02467300s / 0.06753000s Average result count: 22.5 min/max result count: 15 / 30 Metrics for Query 3: Count: 5 times executed in whole run AQET: 0.006947 seconds (arithmetic mean) AQET(geom.): 0.006905 seconds (geometric mean) QPS: 143.95 Queries per second minQET/maxQET: 0.00580000s / 0.00795100s Average result count: 4.0 min/max result count: 0 / 10 Metrics for Query 4: Count: 5 times executed in whole run AQET: 0.008858 seconds (arithmetic mean) AQET(geom.): 0.008829 seconds (geometric mean) QPS: 112.89 Queries per second minQET/maxQET: 0.00804400s / 0.01019500s Average result count: 3.4 min/max result count: 0 / 10 Metrics for Query 5: Count: 5 times executed in whole run AQET: 0.087542 seconds (arithmetic mean) AQET(geom.): 0.087327 seconds (geometric mean) QPS: 11.42 Queries per second minQET/maxQET: 0.08165600s / 0.09889200s Average result count: 5.0 min/max result count: 5 / 5 Metrics for Query 6: Count: 5 times executed in whole run AQET: 0.131222 seconds (arithmetic mean) AQET(geom.): 0.131216 seconds (geometric mean) QPS: 7.62 Queries per second minQET/maxQET: 0.12924200s / 0.13298200s Average result count: 3.6 min/max result count: 3 / 5 Metrics for Query 7: Count: 20 times executed in whole run AQET: 0.043601 seconds (arithmetic mean) AQET(geom.): 0.040890 seconds (geometric mean) QPS: 22.94 Queries per second minQET/maxQET: 0.01984400s / 0.06012600s Average result count: 26.4 min/max result count: 5 / 96 Metrics for Query 8: Count: 10 times executed in whole run AQET: 0.018168 seconds (arithmetic mean) AQET(geom.): 0.016205 seconds (geometric mean) QPS: 55.04 Queries per second minQET/maxQET: 0.01097600s / 0.05066900s Average result count: 12.8 min/max result count: 6 / 20 Metrics for Query 9: Count: 20 times executed in whole run AQET: 0.043813 seconds (arithmetic mean) AQET(geom.): 0.043807 seconds (geometric mean) QPS: 22.82 Queries per second minQET/maxQET: 0.04274900s / 0.04504100s Average result count: 0.0 min/max result count: 0 / 0 Metrics for Query 10: Count: 15 times executed in whole run AQET: 0.030697 seconds (arithmetic mean) AQET(geom.): 0.029651 seconds (geometric mean) QPS: 32.58 Queries per second minQET/maxQET: 0.02072000s / 0.03975700s Average result count: 1.1 min/max result count: 0 / 4 real 0 m 5.485 s user 0 m 2.233 s sys 0 m 0.170 s Of the approximately 5.5 seconds of running five query mixes, the test driver spends 2.2 s. The server side processing time is 3.1 s, of which SQL compilation is 1.35 s. The rest is miscellaneous system time. The measurement is on 64-bit Linux, 2GHz dual-Xeon 5130 (8 cores) with 8G RAM. We note that this type of workload would be done with stored procedures or prepared, parameterized queries in the SQL world. There will be some further tuning still but this addresses the bulk of the matter. There will be a separate message about the patch containing these improvements.</dc:description>
  <content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<p>We had a look at Chris Bizer&#39;s initial results with the <a href="http://www4.wiwiss.fu-berlin.de/bizer/BerlinSPARQLBenchmark/spec/index.html" id="link-id105c9f78">Berlin SPARQL Benchmark</a> (<a href="http://www4.wiwiss.fu-berlin.de/bizer/BerlinSPARQLBenchmark/spec/index.html" id="link-id102d62b0">BSBM</a>) on <a href="http://virtuoso.openlinksw.com" id="link-id13eb9780">Virtuoso</a>.  The first results were rather bad, as nearly all of the run time was spent optimizing the <a href="http://dbpedia.org/resource/SPARQL" id="link-id14a51258">SPARQL</a> statements and under 10% actually running them.</p>
<p>So I spent a couple of days on the <a href="http://dbpedia.org/resource/SPARQL" id="link-id0xa5a8d0e8">SPARQL</a>/<a href="http://dbpedia.org/resource/SQL" id="link-id108745b0">SQL</a> compiler, to the effect of making it do a better guess of initial execution plan and streamlining some operations.  In fact, many of the queries in <a href="http://www4.wiwiss.fu-berlin.de/bizer/BerlinSPARQLBenchmark/spec/index.html" id="link-id0xaf04af8">BSBM</a> are not particularly sensitive to execution plan, as they access a very small portion of the database.  So to close the matter, I put in a flag that makes the <a href="http://dbpedia.org/resource/SQL" id="link-id0x1e8d2360">SQL</a> compiler give up on devising new plans if the time of the best plan so far is less than the time spent compiling so far.</p>
<p>With these changes, available now as a diff on top of 5.0.7, we run quite well, several times better than initially.  With the compiler time cut-off in place (ini parameter <code>StopCompilerWhenXOverRunTime = 1</code>), we get the following times, output from the BSBM test driver:</p>
<blockquote>
<pre>
Starting test...

0: 1031.22 ms, total: 1151 ms
1:  982.89 ms, total: 1040 ms
2:  923.27 ms, total:  968 ms
3:  898.37 ms, total:  932 ms
4:  855.70 ms, total:  865 ms

Scale factor:               10000
Number of query mix runs:   5 times
min/max Query mix runtime:  0.8557 s / 1.0312 s
Total runtime:              4.691 seconds
QMpH:                       3836.77 query mixes per hour
CQET:                       0.93829 seconds average runtime 
                                       of query mix
CQET (geom.):               0.93625 seconds geometric mean 
                                       runtime of query mix

Metrics for Query 1:
   Count:                 5 times executed in whole run
   AQET:                  0.012212 seconds (arithmetic mean)
   AQET(geom.):           0.009934 seconds (geometric mean)
   QPS:                   81.89 Queries per second
   minQET/maxQET:         0.00684000s / 0.03115700s
   Average result count:  7.0
   min/max result count:  3 / 10

Metrics for Query 2:
   Count:                 35 times executed in whole run
   AQET:                  0.030490 seconds (arithmetic mean)
   AQET(geom.):           0.029776 seconds (geometric mean)
   QPS:                   32.80 Queries per second
   minQET/maxQET:         0.02467300s / 0.06753000s
   Average result count:  22.5
   min/max result count:  15 / 30

Metrics for Query 3:
   Count:                 5 times executed in whole run
   AQET:                  0.006947 seconds (arithmetic mean)
   AQET(geom.):           0.006905 seconds (geometric mean)
   QPS:                   143.95 Queries per second
   minQET/maxQET:         0.00580000s / 0.00795100s
   Average result count:  4.0
   min/max result count:  0 / 10

Metrics for Query 4:
   Count:                 5 times executed in whole run
   AQET:                  0.008858 seconds (arithmetic mean)
   AQET(geom.):           0.008829 seconds (geometric mean)
   QPS:                   112.89 Queries per second
   minQET/maxQET:         0.00804400s / 0.01019500s
   Average result count:  3.4
   min/max result count:  0 / 10

Metrics for Query 5:
   Count:                 5 times executed in whole run
   AQET:                  0.087542 seconds (arithmetic mean)
   AQET(geom.):           0.087327 seconds (geometric mean)
   QPS:                   11.42 Queries per second
   minQET/maxQET:         0.08165600s / 0.09889200s
   Average result count:  5.0
   min/max result count:  5 / 5

Metrics for Query 6:
   Count:                 5 times executed in whole run
   AQET:                  0.131222 seconds (arithmetic mean)
   AQET(geom.):           0.131216 seconds (geometric mean)
   QPS:                   7.62 Queries per second
   minQET/maxQET:         0.12924200s / 0.13298200s
   Average result count:  3.6
   min/max result count:  3 / 5

Metrics for Query 7:
   Count:                 20 times executed in whole run
   AQET:                  0.043601 seconds (arithmetic mean)
   AQET(geom.):           0.040890 seconds (geometric mean)
   QPS:                   22.94 Queries per second
   minQET/maxQET:         0.01984400s / 0.06012600s
   Average result count:  26.4
   min/max result count:  5 / 96

Metrics for Query 8:
   Count:                 10 times executed in whole run
   AQET:                  0.018168 seconds (arithmetic mean)
   AQET(geom.):           0.016205 seconds (geometric mean)
   QPS:                   55.04 Queries per second
   minQET/maxQET:         0.01097600s / 0.05066900s
   Average result count:  12.8
   min/max result count:  6 / 20

Metrics for Query 9:
   Count:                 20 times executed in whole run
   AQET:                  0.043813 seconds (arithmetic mean)
   AQET(geom.):           0.043807 seconds (geometric mean)
   QPS:                   22.82 Queries per second
   minQET/maxQET:         0.04274900s / 0.04504100s
   Average result count:  0.0
   min/max result count:  0 / 0

Metrics for Query 10:
   Count:                 15 times executed in whole run
   AQET:                  0.030697 seconds (arithmetic mean)
   AQET(geom.):           0.029651 seconds (geometric mean)
   QPS:                   32.58 Queries per second
   minQET/maxQET:         0.02072000s / 0.03975700s
   Average result count:  1.1
   min/max result count:  0 / 4

   real  0 m 5.485 s
   user  0 m 2.233 s
   sys   0 m 0.170 s
</pre></blockquote>
<p>Of the approximately 5.5 seconds of running five query mixes, the test driver spends 2.2 s.  The server side processing time is 3.1 s, of which SQL compilation is 1.35 s.  The rest is miscellaneous system time.  The measurement is on 64-bit Linux, 2GHz dual-Xeon 5130 (8 cores) with 8G RAM. </p>
<p>We note that this type of workload would be done with stored procedures or prepared, parameterized queries in the SQL world.</p>
<p>There will be some further tuning still but this addresses the bulk of the matter.  There will be a separate message about the patch containing these improvements.</p>
]]></content:encoded>
 </rss:item>
 <rss:item xmlns:rss="http://purl.org/rss/1.0/" rdf:about="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2007-09-22#1261">
  <rss:title>Fourth Platform: Data Spaces in The Cloud (Update)</rss:title>
  <dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2007-09-22T23:43:00Z</dc:date>
  <dc:description xmlns:dc="http://purl.org/dc/elements/1.1/">I&#39;ve written extensively on the subject of Data Spaces in relation to the Data Web for while. I&#39;ve also written sparingly about OpenLink Data Spaces (a Data Web Platform that build using Virtuoso). On the other hand, I haven&#39;t shed much light on installation and deployment of OpenLink Data Spaces. Jon Udell recently penned a post titled: The Fourth Platform. The post arrives at a spookily coincidental time (this happens quite often between Jon and I as demonstrated last year during our podcast; the &quot;Fourth&quot; in his Innovators Podcast series). The platform that Jon describes is &quot;Cloud Based&quot; and comprised of Storage and Computation. I would like to add Data Access and Management (native and virtual) under the fourth platform banner with the end product called: &quot;Cloud based Data Spaces&quot;. As I write, we are releasing a Virtuoso AMI (Amazon Image) labeled: virtuoso-dataspace-server. This edition of Virtuoso includes the OpenLink Data Spaces Layer and all of the OAT applications we&#39;ve been developing for a while. What Benefits Does this offer? Personal Data Spaces in the Cloud - a place where you can control and consolidate data across your Blogs, Wikis, RSS/Atom Feed Subscriptions, Shared Bookmarks, Shared Calendars, Discussion Threads, Photo Galleries etc All the data in your Data Space is SPARQL or GData accessible. All of the data in your Personal Data Space is Linked Data from the get go. Each Item of data is URI addressable SIOC support - your Blogs, Wikis, Bookmarks etc.. are based on the SIOC ontology for Semantically Interlinking Online Communities (think: Open social-graph++) FOAF support - your FOAF Profile page provides a URI that is an in-road to all Data in your Data Space. OpenID support - your Personal Data Space ID is usable wherever OpenID is supported. OpenID and FOAF are integrated as per latest FOAF specs Two Integration with Facebook - You can access your Data Space from Facebook or access Facebook from your Data Space Unified Storage - The WebDAV based filesystem provides Cloud Storage that&#39;s integrated with Amazon S3; It also exposes all of your Data Space data via a traditional filesystem UI (think virtual Spotlight); You can also mount this drive to your local filesystem via your native operating system&#39;s WebDAV support SyncML - you can sync calendar and contact details with your Data Space in the cloud from your Mobile phone. A practical Semantic Data Web solution - based on Web Infrastructure and doesn&#39;t require you to do anything beyond exposing URIs for data in your Data Spaces. EC2-AMI Details: AMI ID: ami-e2ca2f8b Manifest file: virtuoso-images/virtuoso-dataspace-server.manifest.xml Installation Guide: Get an Amazon Web Services (AWS) account Signup for S3 and EC2 services Install the EC2 plugin for Firefox Start the EC2 plugin Locate the row containingÂ ami-7c31d515Â Â ManifestÂ virtuoso-test/virtuoso-cloud-beta-9-i386.manifest.xmlÂ (sort using the AMI ID or Manifest Columns or search on pattern: virtuoso, due to name flux) Start the Virtuoso Data Space Server AMI Wait 4-5 minutes (*take a few minutes to create the pre-configured Linux Image*) Connect to http://http://your-ec2-instance-cname:8890/ Log in with user/password dba/dba Go to the Admin UI (Virtuoso Conductor) and change the PWDs for the &#39;dba&#39; and &#39;dav&#39; accounts (*Important!*) Give the &quot;SPARQL&quot; user &quot;SPARQL_UPDATE&quot; privileges (required if you want to exploit the in-built Sponger Middleware) Click on the ODS (OpenLink Data Spaces) link to start an Personal Editon of OpenLink Data Spaces (or go to: http://your-ec2-instance-cname/dataspace/ods/index.html) Log-in using the username and password credentials for the &#39;dav&#39; account (or register a new user note: OpenID is an option here also) Create an Data Space Application Instance by clicking on a Data Space App. Tab Import data from your existing Web 2.0 style applications into OpenLink Data Spaces e.g. subscribe to a few RSS/Atom feeds via the &quot;Feeds Manager&quot; application or import some Bookmarks using the &quot;Bookmarks&quot; application Then look at the imported data in Linked Data form via your ODS generated URIs based on the patterns: http://your-ec2-instance-cname/dataspace/person/your-ods-id#this (URI for You the Person), http://your-ec2-instance-cname/dataspace/person/your-ods-id (FOAF File URI), http://your-ec2-instance-cname/dataspace/your-ods-id (SIOC File URI) (OAT) from your Data Space instanceInstall the OAT VAD package via the Admin UI and then apply the URI patterns below within your browser: http://:8890/oatdemo - Entire OAT Demo Collection http://:8890/rdfbrowser - RDF Browser http://:8890/isparql - SPARQL Query Builder (iSPARQL) http://:8890/qbe - SQL Query Builder (iSQL) http://:8890/formdesigner - Forms Builder (for building Meshups based on RDF, SQL, or Web Servives Data Souces) http://:8890/dbdesigner - SQL DB Schema Designer (note a Visual SQL-RDF Mapper is also on it&#39;s way http://:8890/DAV/JS/ - To view the OAT Tree (there are some experimental demos that are missing from the main demo app etc..) There&#39;s more to come!</dc:description>
  <content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[
<p>I&#39;ve written extensively on the subject of <a href="http://www.openlinksw.com/weblog/public/search.vspx?blogid=127&amp;q=data%20spaces&amp;type=text&amp;output=html" id="link-id134c2280">Data Spaces</a> in relation to the <a href="http://www.openlinksw.com/weblog/public/search.vspx?blogid=127&amp;q=data%20web%0D%0A&amp;type=text&amp;output=html" id="link-id105aef90">Data Web</a> for while. I&#39;ve also written sparingly about <a href="http://virtuoso.openlinksw.com/wiki/main/Main/OdsIndex" id="link-id105bd100">OpenLink Data Spaces</a> (a Data Web Platform that build using Virtuoso). On the other hand, I haven&#39;t shed much light on installation and deployment of OpenLink Data Spaces.</p> <p> <a href="http://blog.jonudell.net" id="link-id14347f20">Jon Udell</a> recently penned a post titled: <a href="http://blog.jonudell.net/2007/09/21/the-fourth-platform/" id="link-id1439ed48">The Fourth Platform</a>. The post arrives at a spookily coincidental time (this happens quite often between Jon and I as demonstrated last year during our <a href="http://weblog.infoworld.com/udell/gems/ju_idehen.mp3" id="link-id107d17a8">podcast</a>; the &quot;Fourth&quot; in his Innovators Podcast series).</p> <p>The platform that Jon describes is &quot;Cloud Based&quot; and comprised of Storage and Computation. I would like to add Data Access and Management (native and virtual) under the fourth platform banner with the end product called: &quot;Cloud based Data Spaces&quot;. </p> <p>As I write, we are releasing a Virtuoso AMI (Amazon Image) labeled: virtuoso-dataspace-server. This edition of<a href="http://virtuoso.openlinksw.com" id="link-id13543210"> Virtuoso</a> includes the OpenLink Data Spaces Layer and all of the OAT applications we&#39;ve been developing for a while.</p> <h2>What Benefits Does this offer?</h2> <ol> <li>Personal Data Spaces in the Cloud - a place where you can control and consolidate data across your Blogs, Wikis, RSS/Atom Feed Subscriptions, Shared Bookmarks, Shared Calendars, Discussion Threads, Photo Galleries etc</li> <li>All the data in your Data <a href="http://en.wikipedia.org/wiki/Data_Spaces">Space</a> is <a href="http://dbpedia.org/resource/SPARQL" id="link-id1149a4f8">SPARQL</a> or <a href="http://dbpedia.org/resource/GData" id="link-id107a9f28">GData</a> accessible.</li> <li>All of the data in your Personal Data Space is <a href="http://dbpedia.org/resource/Linked_Data">Linked Data</a> from the get go. Each Item of data is <a href="http://dbpedia.org/resource/Uniform_Resource_Identifier">URI</a> addressable</li> <li> <a href="http://dbpedia.org/resource/SIOC" id="link-id104f4160">SIOC</a> support - your Blogs, Wikis, Bookmarks etc.. are based on the SIOC ontology for Semantically Interlinking Online Communities (think: Open social-graph++) </li> <li> <a href="http://dbpedia.org/resource/Friend_of_a_friend" id="link-id105beb78">FOAF</a> support - your FOAF Profile page provides a URI that is an in-road to all Data in your Data Space.</li> <li> <a href="http://dbpedia.org/resource/OpenID" id="link-id1144e138">OpenID</a> support - your Personal Data Space ID is usable wherever OpenID is supported. OpenID and FOAF are integrated as per latest FOAF specs</li> <li>Two Integration with Facebook - You can access your Data Space from Facebook or access Facebook from your Data Space</li> <li>Unified Storage - The WebDAV based filesystem provides Cloud Storage that&#39;s integrated with Amazon S3; It also exposes all of your Data Space data via a traditional filesystem UI (think virtual Spotlight); You can also mount this drive to your local filesystem via your native operating system&#39;s WebDAV support</li> <li> <a href="http://dbpedia.org/resource/SyncML" id="link-id11128f48">SyncML</a> - you can sync calendar and contact details with your Data Space in the cloud from your Mobile phone.</li> <li>A practical Semantic Data Web solution - based on Web Infrastructure and doesn&#39;t require you to do anything beyond exposing URIs for data in your Data Spaces.</li> </ol> <h2> <a href="http://dbpedia.org/resource/Amazon_Elastic_Compute_Cloud" id="link-id115d1920">EC2</a>-AMI Details:</h2> <ul>AMI ID: ami-e2ca2f8b</ul> <ul>Manifest file: virtuoso-images/virtuoso-dataspace-server.manifest.xml</ul> <h2>Installation Guide:</h2> <ol> <li>Get an Amazon Web Services (AWS) account</li> <li>Signup for S3 and EC2 services</li> <li>Install the EC2 plugin for Firefox</li> <li>Start the EC2 plugin</li> <li>Locate the row containingÂ <b>ami-7c31d515Â Â ManifestÂ virtuoso-test/virtuoso-cloud-beta-9-i386.manifest.xmlÂ </b>(sort using the AMI ID or Manifest Columns or search on pattern: virtuoso, due to name flux)</li> <li>Start the Virtuoso Data Space Server AMI</li> <li>Wait 4-5 minutes (*take a few minutes to create the pre-configured Linux Image*)</li> <li>Connect to http://<public_dns_name_of_your_instance>http://your-ec2-instance-cname:8890/ Log in with user/password dba/dba</public_dns_name_of_your_instance> </li> <li>Go to the Admin UI (Virtuoso Conductor) and change the PWDs for the &#39;dba&#39; and &#39;dav&#39; accounts (*Important!*)</li> <li>Give the &quot;SPARQL&quot; user &quot;SPARQL_UPDATE&quot; privileges (required if you want to exploit the in-built Sponger Middleware)</li> <li>Click on the <a href="http://dbpedia.org/resource/OpenLink_Data_Spaces">ODS</a> (OpenLink Data Spaces) link to start an Personal Editon of OpenLink Data Spaces (or go to: http://your-ec2-instance-cname/dataspace/ods/index.html)</li> <li>Log-in using the username and password credentials for the &#39;dav&#39; account (or register a new user note: OpenID is an option here also) Create an Data Space Application Instance by clicking on a Data Space App. Tab</li> <li>Import data from your existing Web 2.0 style applications into OpenLink Data Spaces e.g. subscribe to a few RSS/Atom feeds via the &quot;Feeds Manager&quot; application or import some Bookmarks using the &quot;Bookmarks&quot; application</li> <li>Then look at the imported data in Linked Data form via your ODS generated URIs based on the patterns: http://your-ec2-instance-cname/dataspace/person/your-ods-id#this (URI for You the Person), http://your-ec2-instance-cname/dataspace/person/your-ods-id (FOAF File URI), http://your-ec2-instance-cname/dataspace/your-ods-id (SIOC File URI)<br /> </li> </ol> <h2> (OAT) from your Data Space instance</h2>Install the OAT VAD package via the Admin UI and then apply the URI patterns below within your browser:<br /> <ol> <li>http://<public_dns_name_of_your_instance>:8890/oatdemo - Entire OAT Demo Collection</public_dns_name_of_your_instance> </li> <li>http://<public_dns_name_of_your_instance>:8890/rdfbrowser - RDF Browser</public_dns_name_of_your_instance> </li> <li>http://<public_dns_name_of_your_instance>:8890/isparql - SPARQL Query Builder (iSPARQL)</public_dns_name_of_your_instance> </li> <li>http://<public_dns_name_of_your_instance>:8890/qbe - SQL Query Builder (iSQL)</public_dns_name_of_your_instance> </li> <li>http://<public_dns_name_of_your_instance>:8890/formdesigner - Forms Builder (for building Meshups based on RDF, SQL, or Web Servives Data Souces)</public_dns_name_of_your_instance> </li> <li>http://<public_dns_name_of_your_instance>:8890/dbdesigner - SQL DB Schema Designer (note a Visual SQL-RDF Mapper is also on it&#39;s way</public_dns_name_of_your_instance> </li> <li>http://<public_dns_name_of_your_instance>:8890/DAV/JS/ - To view the OAT Tree (there are some experimental demos that are missing from the main demo app etc..) </public_dns_name_of_your_instance> </li> </ol> <p>There&#39;s more to come!</p>

]]></content:encoded>
 </rss:item>
 <rss:item xmlns:rss="http://purl.org/rss/1.0/" rdf:about="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2007-04-01#1175">
  <rss:title>Open Source and Open Data Movements</rss:title>
  <dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2007-04-01T22:02:15Z</dc:date>
  <dc:description xmlns:dc="http://purl.org/dc/elements/1.1/">Dare Obasanjo&#39;s post about the issue of Open Data (or Open Data Access), indicates that the &quot;Open Data&quot; issue is gradually beginning to resonate across a broader audience. From my perspective on things I prefer to align my articulation of the changes that are occurring across our industry (courtesy of the Internet Inflection) to the MVC pattern. Re. the Web Versions (or Dimensions of Interaction): Web 1.0 - (V)iewer (Interactive Web experienced via Browser) Web 2.0 - (C)ontroller Web (via Web Services API) Web 3.0 - (M)odel (via the RDF Data Model as the basis for an Open and Standards based Concrete Conceptual Data Model) The same applies to evolution of Openness: Early work by Sun and other early UNIX Vendors - (V)iewer (Interaction with the same OS across different hardware platforms) Open Source Movement - (C)ontroller (Open Access to Application Source Code ) Open Data - (M)odel (*where we are now* Freeing the Date from the Applications and Services while moving the application development focus to a Concrete Conceptual Data Model focus. The Data Web is a classic example.) In the (C)ontroller realm where the focal point is Application Logic, data access issues aren&#39;t obvious (*I recall my battles with Richard Stallman re. the appropriate Open Source License variant for iODBC during the embryonic years of database and data access technology on Linux*). Data is an enigma in this realm, unfortunately. This implies that &quot;Data Lock-in&quot; occurs deliberately, but in most cases, inadvertently when we make Application Logic the focal point of everything. Another example is Web 2.0 in which the norm (unfortunately) is to suck in your data, and then refuse to give you complete ownership over how it is used (including the fact that you may want to share it elsewhere). Open Data is a really big deal which is why the SWEO supported Linking Open Data Project is a very big deal. The good news is that this movement is gathering moment at an exponential rate :-)</dc:description>
  <content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<p>
<a href="http://www.25hoursaday.com/weblog/PermaLink.aspx?guid=69141977-7514-443d-800b-1f95c1ff8dbe">Dare Obasanjo&#39;s post about the issue of Open Data</a> (or Open Data Access), indicates that the &quot;<a href="http://en.wikipedia.org/wiki/Open_Data">Open Data</a>&quot; issue is gradually beginning to resonate across a broader audience.</p>
<p>From my perspective on things I prefer to align my articulation of the changes that are occurring across our industry (courtesy of the Internet Inflection) to the <a href="http://en.wikipedia.org/wiki/Model-view-controller">MVC pattern</a>.</p>

<p>Re. the Web Versions (or Dimensions of Interaction):</p>
<ul>
Web 1.0 - (V)iewer (Interactive Web experienced via Browser)
</ul>
<ul>
Web 2.0 - (C)ontroller Web (via Web Services API)
</ul>
<ul>
Web 3.0 - (M)odel (via the RDF Data Model as the basis for an Open and Standards based Concrete Conceptual Data Model)</ul>

<p>The same applies to evolution of Openness:</p>
<ul>
Early work by Sun and other early UNIX Vendors - (V)iewer (Interaction with the same OS across different hardware platforms)</ul>
<ul>Open Source Movement - (C)ontroller (Open Access to Application Source Code )</ul>
<ul>Open Data - (M)odel (*where we are now* Freeing the Date from the Applications and Services while moving the application development focus to a Concrete Conceptual Data Model focus. The Data Web is a classic example.)</ul>

<p>In the (C)ontroller realm where the focal point is Application Logic, data access issues aren&#39;t obvious (*I recall <a href="http://207.22.26.166/bytecols/1999-11-03.html">my battles with Richard Stallman re. the appropriate Open Source License variant for iODBC</a> during the embryonic years of database and data access technology on Linux*). Data is an enigma in this realm, unfortunately. This implies that &quot;Data Lock-in&quot; occurs deliberately, but in most cases, inadvertently when we make Application Logic the focal point of everything. Another example is Web 2.0 in which the norm (unfortunately) is to suck in your data, and then refuse to give you complete ownership over how it is used (including the fact that you may want to share it elsewhere).</p>


<a href="http://en.wikipedia.org/wiki/Open_Data">Open Data</a> is a really big deal which is why the <a href="http://www.w3.org/2001/sw/sweo/">SWEO</a> supported <a href="http://esw.w3.org/topic/SweoIG/TaskForces/CommunityProjects/LinkingOpenData">Linking Open Data Project</a> is a very big deal. The good news is that this movement is gathering moment at an exponential rate :-)]]></content:encoded>
 </rss:item>
 <rss:item xmlns:rss="http://purl.org/rss/1.0/" rdf:about="http://www.openlinksw.com/weblog/oerling/?date=2007-01-10#1116">
  <rss:title>Virtuoso 5.0 Preview</rss:title>
  <dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2007-01-10T15:08:43Z</dc:date>
  <dc:description xmlns:dc="http://purl.org/dc/elements/1.1/">As previously said, we have a Virtuoso with brand new engine multithreading. It is now complete and passes its regular test suite. This is the basis for Virtuoso 5.0, to be available as the open source and commercial cuts as before. As one benchmark, we used the TPC-C test driver that has always been bundled with Virtuoso. We ran 100000 new orders worth of the TPC-C transaction mix first with one client and then with 4 clients, each client going to its own warehouse, so there was not much lock contention. We did this on a 4 core Intel, the working set in RAM. With the old one, 1 client took 1m43 and 4 clients took 3m47. With the new one, one client took 1m30 and 4 clients took 2m37. So, 400000 new orders in 2m37, for 152820 new orders per minute as opposed to 105720 per minute previously. Do not confuse with the official tpmC metric, that one involves a whole bunch of further rules. TPC-C has activity spread over a few different tables. With tests dealing with fewer tables, improvements in parallelism are far greater. Aside from better parallelism, we have other features. One of them is a change in the read committed isolation, so that we now return the previous committed state for uncommitted changed rows instead of waiting for the updating transaction to terminate. This is similar to what Oracle does for read committed. Also we now do log checkpoints without having to abort pending write transactions. When we have faster inserts, we actually see the RDF bulk loader run slower. This is really backwards. The reason is that while one thread parses, other threads insert and if the inserting threads are done they go to wait on a semaphore and this whole business of context switching absolutely kills performance. With slower inserts, the parser keeps ahead so there is less context switching, hence better overall throughput. I still do not get it how the OS can spend between 1.5 and 6 microseconds, several thousand instructions, deciding what to do next when there are only 3-4 eligible threads and all the rest is background which goes with a few dozen slices per second. Solaris is a little better than Linux at this but not dramatically so. Mac OS X is way worse. As said, we use Oracle 10G2 on the same platform (Linux FC5 64 bit) for sparring. It is really a very good piece of software. We have written the TPC C transactions in SQL/PL. What is surprising is that these procedures run amazingly slowly, even with a single client. Otherwise the Oracle engine is very fast. Well, as I recall, the official TPC C runs with Oracle use an OCI client and no stored procedures. Strange. While Virtuoso for example fills the initial TPC C state a little faster than Oracle, the procedures run 5-10 times slower with Oracle than with Virtuoso, all data in warm cache and a single client. While some parts of Oracle are really well optimized, all basic joins and aggregates etc, we are surprised at how they could have neglected such a central piece as the PL. Also, we have looked at transaction semantics. Serializable is mostly serializable with Oracle but does not always keep a steady count. Also it does not prevent inserts into a space that has been found empty by a serializable transaction. True, it will not show these inserts to the serializable transaction, so in this it follows the rules. Also, to make a read really repeatable, it seems that the read has to be FOR UPDATE. Otherwise one can not implement a reliable resource transaction, like changing the balance of an account. Anyway, the Virtuoso engine overhaul is now mostly complete. This is of course an open ended topic but the present batch is nearing completion. We have gone through as many as 3 implementations of hash joins, some things have yet to be finished there. Oracle has very good hash joins. The only way we could match that was to do it all in memory, dropping any persistent storage of the hash. This is of course OK if the hash is not very large and anyway hash joins go sour if the hash does not fit in working set. As next topics, we have more RDF and the LUBM benchmark to finish. Also we should revisit TPC-D. Databases are really quite complicated and extensive pieces of software. Much more so than the casual observer might think.</dc:description>
  <content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<p>As <a href="http://www.openlinksw.com/dataspace/oerling/weblog/Orri%20Erling%27s%20Blog/1108" id="link-id10c66e68">previously said</a>, we have a <a href="http://virtuoso.openlinksw.com" id="link-id0x1a5caeb8">Virtuoso</a> with brand new engine multithreading. It is now complete and passes its regular test suite. This is the basis for Virtuoso 5.0, to be available as the open source and commercial cuts as before.</p>
<p>As one benchmark, we used the <a href="http://dbpedia.org/resource/TPC-C" id="link-id0x15f8cbd8">TPC-C</a> test driver that has always been bundled with Virtuoso. We ran 100000 new orders worth of the TPC-C transaction mix first with one client and then with 4 clients, each client going to its own warehouse, so there was not much lock contention. We did this on a 4 core Intel, the working set in RAM. With the old one, 1 client took 1m43 and 4 clients took 3m47. With the new one, one client took 1m30 and 4 clients took 2m37. So, 400000 new orders in 2m37, for 152820 new orders per minute as opposed to 105720 per minute previously. Do not confuse with the official tpmC metric, that one involves a whole bunch of further rules.</p>
<p>TPC-C has activity spread over a few different tables. With tests dealing with fewer tables, improvements in parallelism are far greater.</p>
<p>Aside from better parallelism, we have other features. One of them is a change in the read committed isolation, so that we now return the previous committed state for uncommitted changed rows instead of waiting for the updating transaction to terminate. This is similar to what <a href="http://dbpedia.org/resource/Oracle_Database" id="link-id0x18184c08">Oracle</a> does for read committed. Also we now do log checkpoints without having to abort pending write transactions.</p>
<p>When we have faster inserts, we actually see the <a href="http://dbpedia.org/resource/Resource_Description_Framework" id="link-id0xde6fca0">RDF</a> bulk loader run slower. This is really backwards. The reason is that while one thread parses, other threads insert and if the inserting threads are done they go to wait on a semaphore and this whole business of context switching absolutely kills performance. With slower inserts, the parser keeps ahead so there is less context switching, hence better overall throughput. I still do not get it how the OS can spend between 1.5 and 6 microseconds, several thousand instructions, deciding what to do next when there are only 3-4 eligible threads and all the rest is background which goes with a few dozen slices per second. Solaris is a little better than Linux at this but not dramatically so. Mac OS X is way worse.</p>
<p>As said, we use Oracle 10G2 on the same platform (Linux FC5 64 bit) for sparring. It is really a very good piece of software. We have written the TPC C transactions in <a href="http://dbpedia.org/resource/SQL" id="link-id0x15b33600">SQL</a>/PL. What is surprising is that these procedures run amazingly slowly, even with a single client. Otherwise the Oracle engine is very fast. Well, as I recall, the official TPC C runs with Oracle use an OCI client and no stored procedures. Strange. While Virtuoso for example fills the initial TPC C state a little faster than Oracle, the procedures run 5-10 times slower with Oracle than with Virtuoso, all <a href="http://dbpedia.org/resource/Data" id="link-id0xd9d1150">data</a> in warm cache and a single client. While some parts of Oracle are really well optimized, all basic joins and aggregates etc, we are surprised at how they could have neglected such a central piece as the PL.</p>
<p>Also, we have looked at transaction semantics. Serializable is mostly serializable with Oracle but does not always keep a steady count. Also it does not prevent inserts into a space that has been found empty by a serializable transaction. True, it will not show these inserts to the serializable transaction, so in this it follows the rules. Also, to make a read really repeatable, it seems that the read has to be FOR UPDATE. Otherwise one can not implement a reliable resource transaction, like changing the balance of an account.</p>
<p>Anyway, the Virtuoso engine overhaul is now mostly complete. This is of course an open ended topic but the present batch is nearing completion. We have gone through as many as 3 implementations of hash joins, some things have yet to be finished there. Oracle has very good hash joins. The only way we could match that was to do it all in memory, dropping any persistent storage of the hash. This is of course OK if the hash is not very large and anyway hash joins go sour if the hash does not fit in working set.</p>
<p>As next topics, we have more RDF and the LUBM benchmark to finish. Also we should revisit TPC-D.</p>
<p>Databases are really quite complicated and extensive pieces of software. Much more so than the casual observer might think.</p>]]></content:encoded>
 </rss:item>
 <rss:item xmlns:rss="http://purl.org/rss/1.0/" rdf:about="http://www.openlinksw.com/blog/vdb/blog/?date=2007-01-10#1117">
  <rss:title>Virtuoso 5.0 Preview</rss:title>
  <dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2007-01-10T14:58:29Z</dc:date>
  <dc:description xmlns:dc="http://purl.org/dc/elements/1.1/">Virtuoso 5.0 Preview As previously said, we have a Virtuoso with brand new engine multithreading. It is now complete and passes its regular test suite. This is the basis for Virtuoso 5.0, to be available as the open source and commercial cuts as before. As one benchmark, we used the TPC-C test driver that has always been bundled with Virtuoso. We ran 100000 new orders worth of the TPC-C transaction mix first with one client and then with 4 clients, each client going to its own warehouse, so there was not much lock contention. We did this on a 4 core Intel, the working set in RAM. With the old one, 1 client took 1m43 and 4 clients took 3m47. With the new one, one client took 1m30 and 4 clients took 2m37. So, 400000 new orders in 2m37, for 152820 new orders per minute as opposed to 105720 per minute previously. Do not confuse with the official tpmC metric, that one involves a whole bunch of further rules. TPC-C has activity spread over a few different tables. With tests dealing with fewer tables, improvements in parallelism are far greater. Aside from better parallelism, we have other features. One of them is a change in the read committed isolation, so that we now return the previous committed state for uncommitted changed rows instead of waiting for the updating transaction to terminate. This is similar to what Oracle does for read committed. Also we now do log checkpoints without having to abort pending write transactions. When we have faster inserts, we actually see the RDF bulk loader run slower. This is really backwards. The reason is that while one thread parses, other threads insert and if the inserting threads are done they go to wait on a semaphore and this whole business of context switching absolutely kills performance. With slower inserts, the parser keeps ahead so there is less context switching, hence better overall throughput. I still do not get it how the OS can spend between 1.5 and 6 microseconds, several thousand instructions, deciding what to do next when there are only 3-4 eligible threads and all the rest is background which goes with a few dozen slices per second. Solaris is a little better than Linux at this but not dramatically so. Mac OS X is way worse. As said, we use Oracle 10G2 on the same platform (Linux FC5 64 bit) for sparring. It is really a very good piece of software. We have written the TPC C transactions in SQL/PL. What is surprising is that these procedures run amazingly slowly, even with a single client. Otherwise the Oracle engine is very fast. Well, as I recall, the official TPC C runs with Oracle use an OCI client and no stored procedures. Strange. While Virtuoso for example fills the initial TPC C state a little faster than Oracle, the procedures run 5-10 times slower with Oracle than with Virtuoso, all data in warm cache and a single client. While some parts of Oracle are really well optimized, all basic joins and aggregates etc, we are surprised at how they could have neglected such a central piece as the PL. Also, we have looked at transaction semantics. Serializable is mostly serializable with Oracle but does not always keep a steady count. Also it does not prevent inserts into a space that has been found empty by a serializable transaction. True, it will not show these inserts to the serializable transaction, so in this it follows the rules. Also, to make a read really repeatable, it seems that the read has to be FOR UPDATE. Otherwise one can not implement a reliable resource transaction, like changing the balance of an account. Anyway, the Virtuoso engine overhaul is now mostly complete. This is of course an open ended topic but the present batch is nearing completion. We have gone through as many as 3 implementations of hash joins, some things have yet to be finished there. Oracle has very good hash joins. The only way we could match that was to do it all in memory, dropping any persistent storage of the hash. This is of course OK if the hash is not very large and anyway hash joins go sour if the hash does not fit in working set. As next topics, we have more RDF and the LUBM benchmark to finish. Also we should revisit TPC-D. Databases are really quite complicated and extensive pieces of software. Much more so than the casual observer might think.</dc:description>
  <content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<div>
<div style="display:none;">Virtuoso 5.0 Preview</div>
<p>As <a href="http://www.openlinksw.com/dataspace/oerling/weblog/Orri%20Erling%27s%20Blog/1108" id="link-id10c66e68">previously said</a>, we have a <a href="http://virtuoso.openlinksw.com" id="link-id0x15b8d948">Virtuoso</a> with brand new engine multithreading. It is now complete and passes its regular test suite. This is the basis for Virtuoso 5.0, to be available as the open source and commercial cuts as before.</p>
<p>As one benchmark, we used the <a href="http://dbpedia.org/resource/TPC-C" id="link-id0x15fc4380">TPC-C</a> test driver that has always been bundled with Virtuoso. We ran 100000 new orders worth of the TPC-C transaction mix first with one client and then with 4 clients, each client going to its own warehouse, so there was not much lock contention. We did this on a 4 core Intel, the working set in RAM. With the old one, 1 client took 1m43 and 4 clients took 3m47. With the new one, one client took 1m30 and 4 clients took 2m37. So, 400000 new orders in 2m37, for 152820 new orders per minute as opposed to 105720 per minute previously. Do not confuse with the official tpmC metric, that one involves a whole bunch of further rules.</p>
<p>TPC-C has activity spread over a few different tables. With tests dealing with fewer tables, improvements in parallelism are far greater.</p>
<p>Aside from better parallelism, we have other features. One of them is a change in the read committed isolation, so that we now return the previous committed state for uncommitted changed rows instead of waiting for the updating transaction to terminate. This is similar to what <a href="http://dbpedia.org/resource/Oracle_Database" id="link-id0xe8cc528">Oracle</a> does for read committed. Also we now do log checkpoints without having to abort pending write transactions.</p>
<p>When we have faster inserts, we actually see the <a href="http://dbpedia.org/resource/Resource_Description_Framework" id="link-id0xe0e5ff8">RDF</a> bulk loader run slower. This is really backwards. The reason is that while one thread parses, other threads insert and if the inserting threads are done they go to wait on a semaphore and this whole business of context switching absolutely kills performance. With slower inserts, the parser keeps ahead so there is less context switching, hence better overall throughput. I still do not get it how the OS can spend between 1.5 and 6 microseconds, several thousand instructions, deciding what to do next when there are only 3-4 eligible threads and all the rest is background which goes with a few dozen slices per second. Solaris is a little better than Linux at this but not dramatically so. Mac OS X is way worse.</p>
<p>As said, we use Oracle 10G2 on the same platform (Linux FC5 64 bit) for sparring. It is really a very good piece of software. We have written the TPC C transactions in <a href="http://dbpedia.org/resource/SQL" id="link-id0x183aac30">SQL</a>/PL. What is surprising is that these procedures run amazingly slowly, even with a single client. Otherwise the Oracle engine is very fast. Well, as I recall, the official TPC C runs with Oracle use an OCI client and no stored procedures. Strange. While Virtuoso for example fills the initial TPC C state a little faster than Oracle, the procedures run 5-10 times slower with Oracle than with Virtuoso, all <a href="http://dbpedia.org/resource/Data" id="link-id0x1659fd20">data</a> in warm cache and a single client. While some parts of Oracle are really well optimized, all basic joins and aggregates etc, we are surprised at how they could have neglected such a central piece as the PL.</p>
<p>Also, we have looked at transaction semantics. Serializable is mostly serializable with Oracle but does not always keep a steady count. Also it does not prevent inserts into a space that has been found empty by a serializable transaction. True, it will not show these inserts to the serializable transaction, so in this it follows the rules. Also, to make a read really repeatable, it seems that the read has to be FOR UPDATE. Otherwise one can not implement a reliable resource transaction, like changing the balance of an account.</p>
<p>Anyway, the Virtuoso engine overhaul is now mostly complete. This is of course an open ended topic but the present batch is nearing completion. We have gone through as many as 3 implementations of hash joins, some things have yet to be finished there. Oracle has very good hash joins. The only way we could match that was to do it all in memory, dropping any persistent storage of the hash. This is of course OK if the hash is not very large and anyway hash joins go sour if the hash does not fit in working set.</p>
<p>As next topics, we have more RDF and the LUBM benchmark to finish. Also we should revisit TPC-D.</p>
<p>Databases are really quite complicated and extensive pieces of software. Much more so than the casual observer might think.</p>
</div>]]></content:encoded>
 </rss:item>
 <rss:item xmlns:rss="http://purl.org/rss/1.0/" rdf:about="http://www.openlinksw.com/blog/vdb/blog/?date=2007-01-09#1110">
  <rss:title>Virtuoso TPCC and Multiprocessor Linux and Mac</rss:title>
  <dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2007-01-09T06:35:06Z</dc:date>
  <dc:description xmlns:dc="http://purl.org/dc/elements/1.1/">Virtuoso TPCC and Multiprocessor Linux and Mac We have updated our article on Virtuoso scalability with two new platforms: A 2 x dual core Intel Xeon and a Mac Mini with an Intel Core Duo. We have more than quadrupled the best result so far. The best score so far is 83K transactions per minute with a 40 warehouse (about 4G) database. This is attributable to the process running in mostly memory, with 3 out of 4 cores busy on the database server. But even when doubling the database size and number of 3 clients, we stay at 49K transactions per minute, now with a little under 2 cores busy and am average of 20 disk reads pending at all times, split over 4 SATA disks. The measurement is the count of completed transactions during a 1h run. With the 80 warehouse database, it took about 18 minutes for the system to reach steady state, with a warm working set, hence the actual steady rate is somewhat higher than 49K, as the warm up period was included in the measurement. The metric on the Mac Mini was 2.7K with 2G RAM and one disk. The CPU usage was about one third of one core. Since we have had rates of over 10K with 2G RAM, we attribute the low result to running on a single disk which is not very fast at that. We have run tests in 64 and 32 bit modes but have found little difference as long as actual memory does not exceed 4g. If anything, 32 bit binaries should have an advantage in cache hit rate since most data structures take less space there. After the process size exceeds the 32 bit limit, there is a notable difference in favor of 64 bit. Having more than 4G of database buffers produces a marked advantage over letting the OS use the space for file system cache. So, 64 bit is worthwhile but only if there is enough memory. As for X86 having more registers in 64 bit mode, we have not specifically measured what effect that might have. We also note that Linux has improved a great deal with respect to multiprocessor configurations. We use a very simple test with a number of threads acquiring and then immediately freeing the same mutex. On single CPU systems, the real time has pretty much increased linearly with the number of threads. On multiprocessor systems, we used to get very non-linear behavior, with 2 threads competing for the same mutex taking tens of times the real time as opposed to one thread. At last measurement, with a 64 bit FC 5, we saw 2 threads take 7x the real time when competing for the same mutex. This is in the same ballpark as Solaris 10 on a similar system. Mac OS X 10.4 Tiger on a 2x dual core Xeon Mac Pro did the worst so far, with two threads taking over 70x the time of one. With a Mac Mini with a single Core Duo, the factor between one thread and two was 73. Also the proportion of system CPU on Tiger was consistently higher than on Solaris or Linux when running the same benchmarks. Of course for most applications this test is not significant but it is relevant for database servers, as there are many very short critical sections involved in multithreaded processing of indices and the like.</dc:description>
  <content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<div>
<div style="display:none;">Virtuoso TPCC and Multiprocessor Linux and Mac</div>
<p>We have <a href="http://virtuoso.openlinksw.com/wiki/main/Main/VOSScale" rel="sql" id="link-id10650ec0">updated our article</a> on <a href="http://virtuoso.openlinksw.com" id="link-id0xc41ba10">Virtuoso</a> scalability with two new platforms: A 2 x dual core Intel Xeon and a Mac Mini with an Intel Core Duo.</p>
<p>We have more than quadrupled the best result so far.</p>
<p>The best score so far is 83K transactions per minute with a 40 warehouse (about 4G) database. This is attributable to the process running in mostly memory, with 3 out of 4 cores busy on the database server. But even when doubling the database size and number of 3 clients, we stay at 49K transactions per minute, now with a little under 2 cores busy and am average of 20 disk reads pending at all times, split over 4 SATA disks. The measurement is the count of completed transactions during a 1h run. With the 80 warehouse database, it took about 18 minutes for the system to reach steady state, with a warm working set, hence the actual steady rate is somewhat higher than 49K, as the warm up period was included in the measurement.</p>
<p>The metric on the Mac Mini was 2.7K with 2G RAM and one disk. The CPU usage was about one third of one core. Since we have had rates of over 10K with 2G RAM, we attribute the low result to running on a single disk which is not very fast at that.</p>
<p>We have run tests in 64 and 32 bit modes but have found little difference as long as actual memory does not exceed 4g. If anything, 32 bit binaries should have an advantage in cache hit rate since most <a href="http://dbpedia.org/resource/Data" id="link-id0xdf23240">data</a> structures take less space there. After the process size exceeds the 32 bit limit, there is a notable difference in favor of 64 bit. Having more than 4G of database buffers produces a marked advantage over letting the OS use the space for file system cache. So, 64 bit is worthwhile but only if there is enough memory. As for X86 having more registers in 64 bit mode, we have not specifically measured what effect that might have.</p>
<p>We also note that Linux has improved a great deal with respect to multiprocessor configurations. We use a very simple test with a number of threads acquiring and then immediately freeing the same mutex. On single CPU systems, the real time has pretty much increased linearly with the number of threads. On multiprocessor systems, we used to get very non-linear behavior, with 2 threads competing for the same mutex taking tens of times the real time as opposed to one thread. At last measurement, with a 64 bit FC 5, we saw 2 threads take 7x the real time when competing for the same mutex. This is in the same ballpark as Solaris 10 on a similar system. Mac OS X 10.4 Tiger on a 2x dual core Xeon Mac Pro did the worst so far, with two threads taking over 70x the time of one. With a Mac Mini with a single Core Duo, the factor between one thread and two was 73.</p>
<p>Also the proportion of system CPU on Tiger was consistently higher than on Solaris or Linux when running the same benchmarks. Of course for most applications this test is not significant but it is relevant for database servers, as there are many very short critical sections involved in multithreaded processing of indices and the like.</p>
</div>]]></content:encoded>
 </rss:item>
 <rss:item xmlns:rss="http://purl.org/rss/1.0/" rdf:about="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2006-09-26#1051">
  <rss:title>Virtuoso TPCC and Multiprocessor Linux and Mac</rss:title>
  <dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2006-09-26T19:16:13Z</dc:date>
  <dc:description xmlns:dc="http://purl.org/dc/elements/1.1/">(Cut &amp; Pasted verbatim from Orri Erling&#39;s Weblog.) Virtuoso TPCC and Multiprocessor Linux and Mac: &quot; We have updated our article on Virtuoso scalability with two new platforms: A 2 x dual core Intel Xeon and a Mac Mini with an Intel Core Duo. We have more than quadrupled the best result so far. The best score so far is 83K transactions per minute with a 40 warehouse (about 4G) database. This is attributable to the process running in mostly memory, with 3 out of 4 cores busy on the database server. But even when doubling the database size and number of 3 clients, we stay at 49K transactions per minute, now with a little under 2 cores busy and am average of 20 disk reads pending at all times, split over 4 SATA disks. The measurement is the count of completed transactions during a 1h run. With the 80 warehouse database, it took about 18 minutes for the system to reach steady state, with a warm working set, hence the actual steady rate is somewhat higher than 49K, as the warm up period was included in the measurement. The metric on the Mac Mini was 2.7K with 2G RAM and one disk. The CPU usage was about one third of one core. Since we have had rates of over 10K with 2G RAM, we attribute the low result to running on a single disk which is not very fast at that. We have run tests in 64 and 32 bit modes but have found little difference as long as actual memory does not exceed 4g. If anything, 32 bit binaries should have an advantage in cache hit rate since most data structures take less space there. After the process size exceeds the 32 bit limit, there is a notable difference in favor of 64 bit. Having more than 4G of database buffers produces a marked advantage over letting the OS use the space for file system cache. So, 64 bit is worthwhile but only if there is enough memory. As for X86 having more registers in 64 bit mode, we have not specifically measured what effect that might have. We also note that Linux has improved a great deal with respect to multiprocessor configurations. We use a very simple test with a number of threads acquiring and then immediately freeing the same mutex. On single CPU systems, the real time has pretty much increased linearly with the number of threads. On multiprocessor systems, we used to get very non-linear behavior, with 2 threads competing for the same mutex taking tens of times the real time as opposed to one thread. At last measurement, with a 64 bit FC 5, we saw 2 threads take 7x the real time when competing for the same mutex. This is in the same ballpark as Solaris 10 on a similar system. Mac OS X 10.4 Tiger on a 2x dual core Xeon Mac Pro did the worst so far, with two threads taking over 70x the time of one. With a Mac Mini with a single Core Duo, the factor between one thread and two was 73. Also the proportion of system CPU on Tiger was consistently higher than on Solaris or Linux when running the same benchmarks. Of course for most applications this test is not significant but it is relevant for database servers, as there are many very short critical sections involved in multithreaded processing of indices and the like.</dc:description>
  <content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<p>(Cut &amp; Pasted verbatim from <a href="http://www.openlinksw.com/weblog/oerling/">Orri Erling&#39;s Weblog</a>.)</p>

<p>
<a href="http://www.openlinksw.com/weblog/oerling/?id=1046">Virtuoso TPCC and Multiprocessor Linux and Mac</a>: &quot;</p>
<p>We have updated our <a href="http://virtuoso.openlinksw.com/wiki/main/Main/VOSScale" rel="sql">article on Virtuoso scalability</a> with two new platforms: A 2 x dual core Intel Xeon and a Mac Mini with an Intel Core Duo.</p>
<p>We have more than quadrupled the best result so far.</p>
<p>The best score so far is 83K transactions per minute with a 40 warehouse (about 4G) database. This is attributable to the process running in mostly memory, with 3 out of 4 cores busy on the database server. But even when doubling the database size and number of 3 clients, we stay at 49K transactions per minute, now with a little under 2 cores busy and am average of 20 disk reads pending at all times, split over 4 SATA disks. The measurement is the count of completed transactions during a 1h run. With the 80 warehouse database, it took about 18 minutes for the system to reach steady state, with a warm working set, hence the actual steady rate is somewhat higher than 49K, as the warm up period was included in the measurement.</p>
<p>The metric on the Mac Mini was 2.7K with 2G RAM and one disk. The CPU usage was about one third of one core. Since we have had rates of over 10K with 2G RAM, we attribute the low result to running on a single disk which is not very fast at that.</p>
<p>We have run tests in 64 and 32 bit modes but have found little difference as long as actual memory does not exceed 4g. If anything, 32 bit binaries should have an advantage in cache hit rate since most data structures take less space there. After the process size exceeds the 32 bit limit, there is a notable difference in favor of 64 bit. Having more than 4G of database buffers produces a marked advantage over letting the OS use the space for file system cache. So, 64 bit is worthwhile but only if there is enough memory. As for X86 having more registers in 64 bit mode, we have not specifically measured what effect that might have.</p>
<p>We also note that Linux has improved a great deal with respect to multiprocessor configurations. We use a very simple test with a number of threads acquiring and then immediately freeing the same mutex. On single CPU systems, the real time has pretty much increased linearly with the number of threads. On multiprocessor systems, we used to get very non-linear behavior, with 2 threads competing for the same mutex taking tens of times the real time as opposed to one thread. At last measurement, with a 64 bit FC 5, we saw 2 threads take 7x the real time when competing for the same mutex. This is in the same ballpark as Solaris 10 on a similar system. Mac OS X 10.4 Tiger on a 2x dual core Xeon Mac Pro did the worst so far, with two threads taking over 70x the time of one. With a Mac Mini with a single Core Duo, the factor between one thread and two was 73.</p>
<p>Also the proportion of system CPU on Tiger was consistently higher than on Solaris or Linux when running the same benchmarks. Of course for most applications this test is not significant but it is relevant for database servers, as there are many very short critical sections involved in multithreaded processing of indices and the like.</p>
]]></content:encoded>
 </rss:item>
 <rss:item xmlns:rss="http://purl.org/rss/1.0/" rdf:about="http://www.openlinksw.com/weblog/oerling/?date=2006-09-25#1112">
  <rss:title>Virtuoso TPCC and Multiprocessor Linux and Mac</rss:title>
  <dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2006-09-25T11:13:22Z</dc:date>
  <dc:description xmlns:dc="http://purl.org/dc/elements/1.1/">We have updated our article on Virtuoso scalability with two new platforms: A 2 x dual core Intel Xeon and a Mac Mini with an Intel Core Duo. We have more than quadrupled the best result so far. The best score so far is 83K transactions per minute with a 40 warehouse (about 4G) database. This is attributable to the process running in mostly memory, with 3 out of 4 cores busy on the database server. But even when doubling the database size and number of 3 clients, we stay at 49K transactions per minute, now with a little under 2 cores busy and am average of 20 disk reads pending at all times, split over 4 SATA disks. The measurement is the count of completed transactions during a 1h run. With the 80 warehouse database, it took about 18 minutes for the system to reach steady state, with a warm working set, hence the actual steady rate is somewhat higher than 49K, as the warm up period was included in the measurement. The metric on the Mac Mini was 2.7K with 2G RAM and one disk. The CPU usage was about one third of one core. Since we have had rates of over 10K with 2G RAM, we attribute the low result to running on a single disk which is not very fast at that. We have run tests in 64 and 32 bit modes but have found little difference as long as actual memory does not exceed 4g. If anything, 32 bit binaries should have an advantage in cache hit rate since most data structures take less space there. After the process size exceeds the 32 bit limit, there is a notable difference in favor of 64 bit. Having more than 4G of database buffers produces a marked advantage over letting the OS use the space for file system cache. So, 64 bit is worthwhile but only if there is enough memory. As for X86 having more registers in 64 bit mode, we have not specifically measured what effect that might have. We also note that Linux has improved a great deal with respect to multiprocessor configurations. We use a very simple test with a number of threads acquiring and then immediately freeing the same mutex. On single CPU systems, the real time has pretty much increased linearly with the number of threads. On multiprocessor systems, we used to get very non-linear behavior, with 2 threads competing for the same mutex taking tens of times the real time as opposed to one thread. At last measurement, with a 64 bit FC 5, we saw 2 threads take 7x the real time when competing for the same mutex. This is in the same ballpark as Solaris 10 on a similar system. Mac OS X 10.4 Tiger on a 2x dual core Xeon Mac Pro did the worst so far, with two threads taking over 70x the time of one. With a Mac Mini with a single Core Duo, the factor between one thread and two was 73. Also the proportion of system CPU on Tiger was consistently higher than on Solaris or Linux when running the same benchmarks. Of course for most applications this test is not significant but it is relevant for database servers, as there are many very short critical sections involved in multithreaded processing of indices and the like.</dc:description>
  <content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<p>We have <a href="http://virtuoso.openlinksw.com/wiki/main/Main/VOSScale" rel="sql" id="link-id10650ec0">updated our article</a> on <a href="http://virtuoso.openlinksw.com" id="link-id0x1aa2efc0">Virtuoso</a> scalability with two new platforms: A 2 x dual core Intel Xeon and a Mac Mini with an Intel Core Duo.</p>
<p>We have more than quadrupled the best result so far.</p>
<p>The best score so far is 83K transactions per minute with a 40 warehouse (about 4G) database. This is attributable to the process running in mostly memory, with 3 out of 4 cores busy on the database server. But even when doubling the database size and number of 3 clients, we stay at 49K transactions per minute, now with a little under 2 cores busy and am average of 20 disk reads pending at all times, split over 4 SATA disks. The measurement is the count of completed transactions during a 1h run. With the 80 warehouse database, it took about 18 minutes for the system to reach steady state, with a warm working set, hence the actual steady rate is somewhat higher than 49K, as the warm up period was included in the measurement.</p>
<p>The metric on the Mac Mini was 2.7K with 2G RAM and one disk. The CPU usage was about one third of one core. Since we have had rates of over 10K with 2G RAM, we attribute the low result to running on a single disk which is not very fast at that.</p>
<p>We have run tests in 64 and 32 bit modes but have found little difference as long as actual memory does not exceed 4g. If anything, 32 bit binaries should have an advantage in cache hit rate since most <a href="http://dbpedia.org/resource/Data" id="link-id0xa1cd02f8">data</a> structures take less space there. After the process size exceeds the 32 bit limit, there is a notable difference in favor of 64 bit. Having more than 4G of database buffers produces a marked advantage over letting the OS use the space for file system cache. So, 64 bit is worthwhile but only if there is enough memory. As for X86 having more registers in 64 bit mode, we have not specifically measured what effect that might have.</p>
<p>We also note that Linux has improved a great deal with respect to multiprocessor configurations. We use a very simple test with a number of threads acquiring and then immediately freeing the same mutex. On single CPU systems, the real time has pretty much increased linearly with the number of threads. On multiprocessor systems, we used to get very non-linear behavior, with 2 threads competing for the same mutex taking tens of times the real time as opposed to one thread. At last measurement, with a 64 bit FC 5, we saw 2 threads take 7x the real time when competing for the same mutex. This is in the same ballpark as Solaris 10 on a similar system. Mac OS X 10.4 Tiger on a 2x dual core Xeon Mac Pro did the worst so far, with two threads taking over 70x the time of one. With a Mac Mini with a single Core Duo, the factor between one thread and two was 73.</p>
<p>Also the proportion of system CPU on Tiger was consistently higher than on Solaris or Linux when running the same benchmarks. Of course for most applications this test is not significant but it is relevant for database servers, as there are many very short critical sections involved in multithreaded processing of indices and the like.</p>
]]></content:encoded>
 </rss:item>
 <rss:item xmlns:rss="http://purl.org/rss/1.0/" rdf:about="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2006-05-31#987">
  <rss:title>Great Product: Parallels Desktop Release Candidate 2 released</rss:title>
  <dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2006-05-31T21:15:21Z</dc:date>
  <dc:description xmlns:dc="http://purl.org/dc/elements/1.1/">I am thoroughly impressed with this product. I have been using Solaris (in its many incarnations since the mid 80&#39;s SunOS days), Windows (since Windows 2.0), Linux (since inception), FreeBSD (since inception), and Mac OS X (since its NexT days). With the above in mind (years of getting into trouble during OS installation and usage etc.. I expected the very worst when attempting to get Solaris 10, Linux (Debian), FreeBSD 6.x, and Windows XP installed on a Mac Mini such that I could have all of these operating systems at my disposal without quad-booting. To my utter disbelief (I am still trying to recover from the immense euphoria..) Parallels delivered to me the absolute simplest installation and usage experience across all said operating systems that I have ever experienced. I now have a MacIntel Mac Mini (one of several that I will be stocking up on while I wait the Microsoft Universal Binary port of Office) that delivers me the long sought nirvana of having Solaris, FreeBSD, Linux, Windows XP, and Mac OS X on a single desktop! If you want to enjoy one of the genuine innovations of our time, simply make parallels an integral part of your Mac OS X experience (whether you are an end-user, developer, administrator, or systems integrator). Parallels Desktop Release Candidate 2, uh, released: &quot; Filed under: OS, Software Get your mice clicking ladies and gentlemen, as Parallels has offered up the final test version of Parallels Desktop for Mac, their virtualization software that allows you to run almost any OS right within Mac OS X. With this version, however, Parallels has increased the app&#39;s final price to $79.99, as they have incorporated their Compressor Server tool (due to user feedback) into the software package for streamlining and optimizing your virtual machines and the amount of disk space they occupy. The beta testing pre-order price of $39.99 is still in place, and probably more appetizing than ever. Other new features and improvements in the Release Candidate 2 include: Significantly improved performance Improved USB performance and broader device support Improved Host-guest networking Automatic network adapters now switch on-the-fly Guest OS no longer steals host IP address in some DHCP servers Fullscreen mode is now customizable Integration with Virtue is now bug-free Customizable Ctrl + Click mapping Guest 32bit color is supported when Parallels Tools is installed Improved Shared folders performance Resolved shared folders/MS Office incompatibility issues Windows 98 no longer consumes 99% host CPU even when idle (in VT-x mode) Also note that if you download this newest release, you must re-install the Parallels Tools for guest Windows installations (NT/2000/XP/2003). As with previous beta releases, this download is free before the software package goes official. Read&#39;|&#39;Permalink&#39;|&#39;Email this&#39;|&#39;Linking&#39;Blogs&#39;|&#39;Comments &quot; (Via The Unofficial Apple Weblog (TUAW).)</dc:description>
  <content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<p>I am thoroughly impressed with this product. I have been using Solaris (in its many incarnations since the mid 80&#39;s SunOS days), Windows (since Windows 2.0), Linux (since inception), FreeBSD (since inception), and Mac OS X (since its NexT days).</p>
<p>With the above in mind (years of getting into trouble during OS installation and usage etc.. I expected the very worst when attempting to get Solaris 10, Linux (Debian), FreeBSD 6.x, and Windows XP installed on a Mac Mini such that I could have all of these operating systems at my disposal without quad-booting. To my utter disbelief (I am still trying to recover from the immense euphoria..) Parallels delivered to me the absolute simplest installation and usage experience across all said operating systems that I have ever experienced.</p>
<p>I now have a MacIntel Mac Mini (one of several that I will be stocking up on while I wait the Microsoft Universal Binary port of Office) that delivers me the long sought nirvana of having Solaris, FreeBSD, Linux, Windows XP, and Mac OS X on a single desktop!</p>
<p>If you want to enjoy one of the genuine innovations of our time, simply make parallels an integral part of your Mac OS X experience (whether you are an end-user, developer, administrator, or systems integrator).</p>

<blockquote>
<p>
<a href="http://www.tuaw.com/2006/05/31/parallels-desktop-release-candidate-2-uh-released/#comments">Parallels Desktop Release Candidate 2, uh, released</a>: &quot;</p>
<p>Filed under: <a href="http://www.tuaw.com/category/os/" rel="tag">OS</a>, <a href="http://www.tuaw.com/category/software/" rel="tag">Software</a>
</p>
<div id="pc623643">
<img vspace="5" hspace="5" border="1" alt="" src="http://www.tuaw.com/media/2006/04/parrellsvirtualization.jpg" />
<br />Get your mice clicking ladies and gentlemen, as Parallels has offered up the final test version of Parallels Desktop for Mac, their virtualization software that allows you to run almost any OS right within Mac OS X. With this version, however, Parallels has increased the app&#39;s final price to $79.99, as they have incorporated their Compressor Server tool (due to user feedback) into the software package for streamlining and optimizing your virtual machines and the amount of disk space they occupy. The beta testing pre-order price of $39.99 is still in place, and probably more appetizing than ever. Other new features and improvements in the Release Candidate 2 include:<br />
<ul>
    <li>Significantly improved performance</li>
    <li>Improved USB performance and broader device support</li>
    <li>Improved Host-guest networking</li>
    <li>Automatic network adapters now switch on-the-fly</li>
    <li>Guest OS no longer steals host IP address in some DHCP servers</li>
    <li>Fullscreen mode is now customizable</li>
    <li>Integration with Virtue is now bug-free</li>
    <li>Customizable Ctrl + Click mapping</li>
    <li>Guest 32bit color is supported when Parallels Tools is installed</li>
    <li>Improved Shared folders performance</li>
    <li>Resolved shared folders/MS Office incompatibility issues</li>
    <li>Windows 98 no longer consumes 99% host CPU even when idle (in VT-x mode)</li>
</ul>
Also note that if you <a href="http://www.parallels.com/en/download/desktop/">download this newest release</a>, you must re-install the Parallels Tools for guest Windows installations (NT/2000/XP/2003). As with previous beta releases, this download is free before the software package goes official.</div>
<h6 style="clear: both; padding: 8px 0 0 0; height: 2px; font-size: 1px; border: 0; margin: 0; padding: 0;"></h6>
<a href="http://www.parallels.com/en/download/desktop/">Read</a>&#39;|&#39;<a href="http://www.tuaw.com/2006/05/31/parallels-desktop-release-candidate-2-uh-released/" rel="bookmark" title="Permanent link to this entry">Permalink</a>&#39;|&#39;<a href="http://www.tuaw.com/forward/623643/" title="Send this entry to a friend via email">Email this</a>&#39;|&#39;<a href="http://www.technorati.com/cosmos/search.html?rank=&fc=1&url=http://www.tuaw.com/2006/05/31/parallels-desktop-release-candidate-2-uh-released/" title="Linking Blogs">Linking&#39;Blogs</a>&#39;|&#39;<a href="http://www.tuaw.com/2006/05/31/parallels-desktop-release-candidate-2-uh-released/#comments" title="View reader comments on this entry">Comments</a>
<br />
<br />
<img src="http://feeds.tuaw.com/weblogsinc/tuaw?g=317" />&quot;

<p>(Via <a href="http://www.tuaw.com">The Unofficial Apple Weblog (TUAW)</a>.)</p>
</blockquote>]]></content:encoded>
 </rss:item>
 <rss:item xmlns:rss="http://purl.org/rss/1.0/" rdf:about="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2006-05-05#968">
  <rss:title>&quot;Free&quot; Databases: Express vs. Open-Source RDBMSs</rss:title>
  <dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2006-05-05T16:02:17Z</dc:date>
  <dc:description xmlns:dc="http://purl.org/dc/elements/1.1/">Very detailed and insightful peek into the state of affairs re. database engines (Open &amp; Closed Source). I added the missing piece regarding the &quot;Virtuoso Conductor&quot; (the Web based Admin UI for Virtuoso) to the original post below. I also added a link to our live SPARQL Demo so that anyone interested can start playing around with SPARQL and SPARQL integrated into SQL right away. Another good thing about this post is the vast amount of valuable links that it contains. To really appreciate this point simply visit my Linkblog (excuse the current layout :-) - a Tab if you come in via the front door of this Data Space (what I used to call My Weblog Home Page). &quot;Free&quot; Databases: Express vs. Open-Source RDBMSs: &quot;Open-source relational database management systems (RDBMSs) are gaining IT mindshare at a rapid pace. As an example, BusinessWeek&#39;s February 6, 2006 &#39; Taking On the Database Giants &#39; article asks &#39;Can open-source upstarts compete with Oracle, IBM, and Microsoft?&#39; and then provides the answer: &#39;It&#39;s an uphill battle, but customers are starting to look at the alternatives.&#39; There&#39;s no shortage of open-source alternatives to look at. The BusinessWeek article concentrates on MySQL, which BW says &#39;is trying to be the Ikea of the database world: cheap, needs some assembly, but has a sleek, modern design and does the job.&#39; The article also discusses Postgre[SQL] and Ingres, as well as EnterpriseDB, an Oracle clone created from PostgreSQL code*. Sun includes PostgreSQL with Solaris 10 and, as of April 6, 2006, with Solaris Express.** *Frank Batten, Jr., the investor who originally funded Red Hat, invested a reported $16 million into Great Bridge with the hope of making a business out of providing paid support to PostgreSQL users. Great Bridge stayed in business only 18 months , having missed an opportunity to sell the business to Red Hat and finding that selling $50,000-per-year support packages for an open-source database wasn&#39;t easy. As Batten concluded, &#39;We could not get customers to pay us big dollars for support contracts.&#39; Perhaps EnterpriseDB will be more successful with a choice of $5,000, $3,000, or $1,000 annual support subscriptions . **Interestingly, Oracle announced in November 2005 that Solaris 10 is &#39;its preferred development and deployment platform for most x64 architectures, including x64 (x86, 64-bit) AMD Opteron and Intel Xeon processor-based systems and Sun&#39;s UltraSPARC(R)-based systems.&#39; There is a surfeit of reviews of current MySQL, PostgreSQL andâto a lesser extentâIngres implementations. These three open-source RDBMSs come with their own or third-party management tools. These systems compete against free versions of commercial (proprietary) databases: SQL Server 2005 Express Edition (and its MSDE 2000 and 1.0 predecessors), Oracle Database 10g Express Edition, IBM DB2 Express-C, and Sybase ASE Express Edition for Linux where database size and processor count limitations aren&#39;t important. Click here for a summary of recent InfoWorld reviews of the full versions of these four databases plus MySQL, which should be valid for Express editions also. The FTPOnline Special Report article, &#39;Microsoft SQL Server Turns 17,&#39; that contains the preceding table is here (requires registration.) SQL Server 2005 Express Edition SP-1 Advanced Features SQL Server 2005 Express Edition with Advanced Features enhances SQL Server 2005 Express Edition (SQL Express or SSX) dramatically, so it deserves special treatment here. SQL Express gains full text indexing and now supports SQL Server Reporting Services (SSRS) on the local SSX instance. The SP-1 with Advanced Features setup package, which Microsoft released on April 18, 2006, installs the release version of SQL Server Management Studio Express (SSMSE) and the full version of Business Intelligence Development Studio (BIDS) for designing and editing SSRS reports. My &#39;Install SP-1 for SQL Server 2005 and Express&#39; article for FTPOnline&#39;s SQL Server Special Report provides detailed, illustrated installation instructions for and related information about the release version of SP-1. SP-1 makes SSX the most capable of all currently available Express editions of commercial RDBMSs for Windows. OpenLink Software&#39;s Virtuoso Open-Source Edition OpenLink Software announced an open-source version of it&#39;s Virtuoso Universal Server commercial DBMS on April 11, 2006. On the initial date of this post, May 2, 2006, Virtuoso Open-Source Edition (VOS) was virtually under the radar as an open-source product. According to this press release, the new edition includes: SPARQL compliant RDF Triple Store SQL-200n Object-Relational Database Engine (SQL, XML, and Free Text) Integrated BPEL Server and Enterprise Service Bus WebDAV and Native File Server Web Application Server that supports PHP, Perl, Python, ASP.NET, JSP, etc. Runtime Hosting for Microsoft .NET, Mono, and Java VOS only lacks the virtual server and replication features that are offered by the commercial edition. VOS includes a Web-based administration tool called the &quot;Virtuoso Conductor&quot; According to Kingsley Idehen&#39;s Weblog, &#39;The Virtuoso build scripts have been successfully tested on Mac OS X (Universal Binary Target), Linux, FreeBSD, and Solaris (AIX, HP-UX, and True64 UNIX will follow soon). A Windows Visual Studio project file is also in the works (ETA some time this week).&#39; InfoWorld&#39;s Jon Udell has tracked Virtuoso&#39;s progress since 2002, with an additional article in 2003 and a one-hour podcast with Kingsley Idehen on April 26, 2006. A major talking point for Virtuoso is its support for Atom 0.3 syndication and publication, Atom 1.0 syndication and (forthcoming) publication, and future support for Google&#39;s GData protocol, as mentioned in this Idehen post. Yahoo!&#39;s Jeremy Zawodny points out that the &#39;fingerprints&#39; of Adam Bosworth, Google&#39;s VP of Engineering and the primary force behind the development of Microsoft Access, &#39;are all over GData.&#39; Click here to display a list of all OakLeaf posts that mention Adam Bosworth. One application for the GData protocol is querying and updating the Google Base database independently of the Google Web client, as mentioned by Jeremy: &#39;It&#39;s not about building an easier onramp to Google Base. ... Well, it is. But, again, that&#39;s the small stuff.&#39; Click here for a list of posts about my experiences with Google Base. Watch for a future OakLeaf post on the subject as the GData APIs gain ground. Open-Source and Free Embedded Database Contenders Open-source and free embedded SQL databases are gaining importance as the number and types of mobile devices and OSs proliferate. Embedded databases usually consist of Java classes or Windows DLLs that are designed to minimize file size and memory consumption. Embedded databases avoid the installation hassles, heavy resource usage and maintenance cost associated with client/server RDBMSs that run as an operating system service. Andrew Hudson&#39;s December 2005 &#39;Open Source databases rounded up and rodeoed&#39; review for The Enquirer provides brief descriptions of one commercial and eight open source database purveyors/products: Sleepycat, MySQL, PostgreSQL, Ingres, InnoBase, Firebird, IBM Cloudscape (a.k.a, Derby), Genezzo, and Oracle. Oracle Sleepycat* isn&#39;t an SQL Database, Oracle InnoDB* is an OEM database engine that&#39;s used by MySQL, and Genezzo is a multi-user, multi-server distributed database engine written in Perl. These special-purpose databases are beyond the scope of this post. * Oracle purchased Sleepycat Software, Inc. in February 2006 and purchased Innobase OY in October 2005 . The press release states: &#39;Oracle intends to continue developing the InnoDB technology and expand our commitment to open source software.&#39; Derby is an open-source release by the Apache Software Foundation of the Cloudscape Java-based database that IBM acquired when it bought Informix in 2001. IBM offers a commercial release of Derby as IBM Cloudscape 10.1. Derby is a Java class library that has a relatively light footprint (2 MB), which make it suitable for client/server synchronization with the IBM DB2 Everyplace Sync Server in mobile applications. The IBM DB2 Everyplace Express Edition isn&#39;t open source or free*, so it doesn&#39;t qualify for this post. The same is true for the corresponding Sybase SQL Anywhere components.** * IBM DB2 Everyplace Express Edition with synchronization costs $379 per server (up to two processors) and $79 per user. DB2 Everyplace Database Edition (without DB2 synchronization) is $49 per user. (Prices are based on those when IBM announced version 8 in November 2003.) ** Sybase&#39;s iAnywhere subsidiary calls SQL Anywhere &#39;the industry&#39;s leading mobile database.&#39; A Sybase SQL Anywhere Personal DB seat license with synchronization to SQL Anywhere Server is $119; the cost without synchronization wasn&#39;t available from the Sybase Web site. Sybase SQL Anywhere and IBM DB2 Everyplace perform similar replication functions. Sun&#39;s Java DB, another commercial version of Derby, comes with the Solaris Enterprise Edition, which bundles Solaris 10, the Java Enterprise System, developer tools, desktop infrastructure and N1 management software. A recent Between the Lines blog entry by ZDNet&#39;s David Berlind waxes enthusiastic over the use of Java DB embedded in a browser to provide offline persistence. RedMonk analyst James Governor and eWeek&#39;s Lisa Vaas wrote about the use of Java DB as a local data store when Tim Bray announced Sun&#39;s Derby derivative and Francois Orsini demonstrated Java DB embedded in the Firefox browser at the ApacheCon 2005 conference. Firebird is derived from Borland&#39;s InterBase 6.0 code, the first commercial relational database management system (RDBMS) to be released as open source. Firebird has excellent support for SQL-92 and comes in three versions: Classic, SuperServer and Embedded for Windows, Linux, Solaris, HP-UX, FreeBSD and MacOS X. The embedded version has a 1.4-MB footprint. Release Candidate 1 for Firebird 2.0 became available on March 30, 2006 and is a major improvement over earlier versions. Borland continues to promote InterBase, now at version 7.5, as a small-footprint, embedded database with commercial Server and Client licenses. SQLite is a featherweight C library for an embedded database that implements most SQL-92 entry- and transitional-level requirements (some through the JDBC driver) and supports transactions within a tiny 250-KB code footprint. Wrappers support a multitude of languages and operating systems, including Windows CE, SmartPhone, Windows Mobile, and Win32. SQLite&#39;s primary SQL-92 limitations are lack of nested transactions, inability to alter a table design once committed (other than with RENAME TABLE and ADD COLUMN operations), and foreign-key constraints. SQLite provides read-only views, triggers, and 256-bit encryption of database files. A downside is the the entire database file is locked when while a transaction is in progress. SQLite uses file access permissions in lieu of GRANT and REVOKE commands. Using SQLite involves no license; its code is entirely in the public domain. The Mozilla Foundation&#39;s Unified Storage wiki says this about SQLite: &#39;SQLite will be the back end for the unified store [for Firefox]. Because it implements a SQL engine, we get querying &#39;for free&#39;, without having to invent our own query language or query execution system. Its code-size footprint is moderate (250k), but it will hopefully simplify much existing code so that the net code-size change should be smaller. It has exceptional performance, and supports concurrent access to the database. Finally, it is released into the public domain, meaning that we will have no licensing issues.&#39; Vieka Technology, Inc.&#39;s eSQL 2.11 is a port of SQLite to Windows Mobile (Pocket PC and Smartphone) and Win32, and includes development tools for Windows devices and PCs, as well as a .NET native data provider. A conventional ODBC driver also is available. eSQL for Windows (Win32) is free for personal and commercial use; eSQL for Windows Mobile requires a license for commercial (for-profit or business) use. HSQLDB isn&#39;t on most reviewers&#39; radar, which is surprising because it&#39;s the default database for OpenOffice.org (OOo) 2.0&#39;s Base suite member. HSQLDB 1.8.0.1 is an open-source (BSD license) Java dembedded database engine based on Thomas Mueller&#39;s original Hypersonic SQL Project. Using OOo&#39;s Base feature requires installing the Java 2.0 Runtime Engine (which is not open-source) or the presence of an alternative open-source engine, such as Kaffe. My prior posts about OOo Base and HSQLDB are here, here and here. The HSQLDB 1.8.0 documentation on SourceForge states the following regarding SQL-92 and later conformance: HSQLDB 1.8.0 supports the dialect of SQL defined by SQL standards 92, 99 and 2003. This means where a feature of the standard is supported, e.g. left outer join, the syntax is that specified by the standard text. Many features of SQL92 and 99 up to Advanced Level are supported and here is support for most of SQL 2003 Foundation and several optional features of this standard. However, certain features of the Standards are not supported so no claim is made for full support of any level of the standards. Other less well-known embedded databases designed for or suited to mobile deployment are Mimer SQL Mobile and VistaDB 2.1 . Neither product is open-source and require paid licensing; VistaDB requires a small up-front payment by developers but offers royalty-free distribution. Java DB, Firebird embedded, SQLite and eSQL 2.11 are contenders for lightweight PC and mobile device database projects that aren&#39;t Windows-only. SQL Server 2005 Everywhere If you&#39;re a Windows developer, SQL Server Mobile is the logical embedded database choice for mobile applications for Pocket PCs and Smartphones. Microsoft&#39;s April 19, 2006 press release delivered the news that SQL Server 2005 Mobile Editon (SQL Mobile or SSM) would gain a big brotherâSQL Server 2005 Everywhere Edition. Currently, the SSM client is licensed (at no charge) to run in production on devices with Windows CE 5.0, Windows Mobile 2003 for Pocket PC or Windows Mobile 5.0, or on PCs with Windows XP Tablet Edition only. SSM also is licensed for development purposes on PCs running Visual Studio 2005. Smart Device replication with SQL Server 2000 SP3 and later databases has been the most common application so far for SSM. By the end of 2006, Microsoft will license SSE for use on all PCs running any Win32 version or the preceding device OSs. A version of SQL Server Management Studio Express (SSMSE)âupdated to support SSEâis expected to release by the end of the year. These features will qualify SSE as the universal embedded database for Windows client and smart-device applications. For more details on SSE, read John Galloway&#39;s April 11, 2006 blog post and my &#39;SQL Server 2005 Mobile Goes Everywhere&#39; article for the FTPOnline Special Report on SQL Server.&quot; (Via OakLeaf Systems.)</dc:description>
  <content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[
 <p>Very detailed and insightful peek into the state of affairs re. database engines (Open &amp; Closed Source).</p>   <p>I added the missing piece regarding the &quot;Virtuoso Conductor&quot; (the Web based Admin UI for Virtuoso) to the original post below. I also added a link to our live SPARQL Demo so that anyone interested can start playing around with SPARQL and SPARQL integrated into SQL right away.</p>  <p>Another good thing about this post is the vast amount of valuable links that it contains. To really appreciate this point simply visit my Linkblog (excuse the current layout :-) - a Tab if you come in via the front door of this <a href="http://www.infoworld.com/opinions/index.html">Data Space</a> (what I used to call <a href="http://www.openlinksw.com/blog/%7Ekidehen/">My Weblog Home Page</a>).</p>   <blockquote>  <p>   <a href="http://oakleafblog.blogspot.com/2006/05/free-databases-express-vs-open-source.html">&quot;Free&quot; Databases: Express vs. Open-Source RDBMSs</a>: &quot;<span style="font-family: verdana;">Open-source relational database management systems (RDBMSs) are gaining IT mindshare at a rapid pace. As an example, <em>BusinessWeek</em>&#39;s February 6, 2006 &#39;</span>   <a href="http://www.businessweek.com/technology/content/feb2006/tc20060206_918648.htm"><span style="font-family: verdana;">Taking On the Database Giants</span>   </a><span style="font-family: verdana;">&#39; article asks &#39;Can open-source upstarts compete with Oracle, IBM, and Microsoft?&#39; and then provides the answer: &#39;It&#39;s an uphill battle, but customers are starting to look at the alternatives.&#39;</span>   <br />   <span style="font-family: Verdana;"></span>   <br />   <span style="font-family: Verdana;">There&#39;s no shortage of open-source alternatives to look at. The <em>BusinessWeek</em> article concentrates on <a href="http://www.mysql.com/">MySQL</a>, which <em>BW</em> says &#39;is trying to be the Ikea of the database world: cheap, needs some assembly, but has a sleek, modern design and does the job.&#39; The article also discusses <a href="http://www.postgresql.org/">Postgre[SQL]</a> and <a href="http://www.ingres.com/products/Prod_Ingres_2006.html">Ingres</a>, as well as <a href="http://www.enterprisedb.com/">EnterpriseDB</a>, an Oracle clone created from PostgreSQL code*. Sun includes <a href="http://www.sun.com/software/solaris/postgres.jsp">PostgreSQL with Solaris 10</a> and, as of April 6, 2006, with <a href="http://docs.sun.com/app/docs/doc/819-2183/6n4g726uc?a=view">Solaris Express</a>.**</span>   <br />   <span style="font-family: Verdana;"></span>   <br />   <span style="font-family: Verdana;"><span style="font-size: 85%;">*Frank Batten, Jr., the investor who originally funded Red Hat, invested a reported </span>    <a href="http://www.theinquirer.net/?article=28201"><span style="font-size: 85%;">$16 million into Great Bridge</span>    </a><span style="font-size: 85%;"> with the hope of making a business out of providing paid support to PostgreSQL users. </span>    <a href="http://news.com.com/2100-1001-272715.html"><span style="font-size: 85%;">Great Bridge stayed in business only 18 months</span>    </a><span style="font-size: 85%;">, having </span>    <a href="http://news.com.com/2100-1001-268915.html"><span style="font-size: 85%;">missed an opportunity to sell the business to Red Hat</span>    </a><span style="font-size: 85%;"> and finding that selling </span>    <a href="http://news.com.com/2100-1001-269729.html"><span style="font-size: 85%;">$50,000-per-year support packages</span>    </a><span style="font-size: 85%;"> for an open-source database wasn&#39;t easy. As Batten concluded, &#39;We could not get customers to pay us big dollars for support contracts.&#39; Perhaps EnterpriseDB will be more successful with a choice of </span>    <a href="http://www.enterprisedb.com/shop.do?cID=10000&pID=10001"><span style="font-size: 85%;">$5,000, $3,000, or $1,000 annual support subscriptions</span>    </a><span style="font-size: 85%;">.</span>   </span>   <br />   <span style="font-family: Verdana;"></span><span style="font-family: Verdana;"></span><span style="font-family: Verdana;"></span>   <br />   <span style="font-family: Verdana; font-size: 85%;">**Interestingly, <a href="http://www.sun.com/smi/Press/sunflash/2005-11/sunflash.20051115.4.xml">Oracle announced in November 2005</a> that Solaris 10 is &#39;its preferred development and deployment platform for most x64 architectures, including x64 (x86, 64-bit) AMD Opteron and Intel Xeon processor-based systems and Sun&#39;s UltraSPARC(R)-based systems.&#39;</span>   <br />   <br />   <span style="font-family: Verdana;">There is a surfeit of reviews of current MySQL, PostgreSQL andâto a lesser extentâIngres implementations. These three open-source RDBMSs come with their own or third-party management tools. These systems compete against free versions of commercial (proprietary) databases: <a href="http://msdn.microsoft.com/vstudio/express/sql/">SQL Server 2005 Express Edition</a> (and its MSDE 2000 and 1.0 predecessors), <a href="http://www.oracle.com/technology/products/database/xe/index.html" target="_blank">Oracle Database 10g Express Edition</a>, <a href="http://www-306.ibm.com/software/data/db2/udb/db2express/download.html" target="_blank">IBM DB2 Express-C</a>, and <a href="http://www.sybase.com/linux_promo" target="_blank">Sybase ASE Express Edition for Linux</a> where database size and processor count limitations aren&#39;t important. Click <a href="http://www.ftponline.com/special/sqlserver/rjennings-overview/table4.aspx">here</a> for a summary of recent <em>InfoWorld</em> reviews of the full versions of these four databases plus MySQL, which should be valid for Express editions also. The <a href="http://www.ftponline.com/special/sqlserver/">FTPOnline Special Report</a> article, &#39;Microsoft SQL Server Turns 17,&#39; that contains the preceding table is <a href="http://www.ftponline.com/special/sqlserver/rjennings-overview/">here</a> (requires registration.)</span>   <br />   <br />  </p>  <p>   <strong><span style="font-family: verdana;">SQL Server 2005 Express Edition SP-1 Advanced Features</span>   </strong>  </p>  <p>   <span style="font-family: Verdana;"><a href="http://www.microsoft.com/downloads/details.aspx?familyid=4C6BA9FD-319A-4887-BC75-3B02B5E48A40&displaylang=en">SQL Server 2005 Express Edition with Advanced Features</a> enhances SQL Server 2005 Express Edition (SQL Express or SSX) dramatically, so it deserves special treatment here. SQL Express gains full text indexing and now supports SQL Server Reporting Services (SSRS) on the local SSX instance. The SP-1 with Advanced Features setup package, which Microsoft released on April 18, 2006, installs the release version of SQL Server Management Studio Express (SSMSE) and the full version of Business Intelligence Development Studio (BIDS) for designing and editing SSRS reports. My &#39;<a href="http://www.ftponline.com/special/sqlserver/rjennings-sp1/">Install SP-1 for SQL Server 2005 and Express</a>&#39; article for FTPOnline&#39;s <a href="http://www.ftponline.com/special/sqlserver/">SQL Server Special Report</a> provides detailed, illustrated installation instructions for and related information about the release version of SP-1. SP-1 makes SSX the most capable of all currently available Express editions of commercial RDBMSs for Windows.</span>  </p>  <p>   <strong><span style="font-family: verdana;">OpenLink Software&#39;s Virtuoso Open-Source Edition</span>   </strong>   <br />   <span style="font-family: verdana;"></span>   <br />   <span style="font-family: verdana;"><a href="http://openlinksw.com/">OpenLink Software</a> announced an <a href="http://virtuoso.openlinksw.com/wiki/main/Main/">open-source version</a> of it&#39;s <a href="http://virtuoso.openlinksw.com/">Virtuoso Universal Server</a> commercial DBMS on April 11, 2006. On the initial date of this post, May 2, 2006, Virtuoso Open-Source Edition (VOS) was virtually under the radar as an open-source product. According to <a href="http://www.openlinksw.com/press/VOSPressRelease.htm">this press release</a>, the new edition includes:</span> <span style="font-family: Verdana;"></span>  </p>  <blockquote>   <span style="font-family: Verdana;"></span>  </blockquote> <blockquote></blockquote> <blockquote></blockquote>  <ul>   <li>     <a href="http://demo.openlinksw.com/sparql_demo/">SPARQL compliant RDF Triple Store</a> </li>   <li>SQL-200n Object-Relational Database Engine (SQL, XML, and Free Text) </li>   <li>Integrated BPEL Server and Enterprise Service Bus</li>   <li>WebDAV and Native File Server </li>   <li>Web Application Server that supports PHP, Perl, Python, ASP.NET, JSP, etc. </li>   <li>Runtime Hosting for Microsoft .NET, Mono, and Java </li>  </ul>VOS only lacks the virtual server and replication features that are offered by the commercial edition. VOS includes a Web-based administration tool called the &quot;Virtuoso Conductor&quot; According to <a href="http://www.openlinksw.com/blog/%7Ekidehen/index.vspx?page=&id=951&sid=&realm=">Kingsley Idehen&#39;s Weblog</a>, &#39;The Virtuoso build scripts have been successfully tested on Mac OS X (Universal Binary Target), Linux, FreeBSD, and Solaris (AIX, HP-UX, and True64 UNIX will follow soon). A Windows Visual Studio project file is also in the works (ETA some time this week).&#39;<br /> <br /> <em>InfoWorld</em>&#39;s Jon Udell has tracked Virtuoso&#39;s progress since <a href="http://www.infoworld.com/article/02/04/12/020415plvirtuoso_1.html">2002</a>, with an <a href="http://www.infoworld.com/article/03/03/21/12virtuoso_1.html">additional article in 2003</a> and a <a href="http://weblog.infoworld.com/udell/2006/04/28.html#a1437">one-hour podcast with Kingsley Idehen</a> on April 26, 2006. A major talking point for Virtuoso is its support for Atom 0.3 syndication and publication, Atom 1.0 syndication and (forthcoming) publication, and future support for Google&#39;s <a href="http://code.google.com/apis/gdata/overview.html">GData protocol</a>, as mentioned in <a href="http://www.openlinksw.com/blog/%7Ekidehen/index.vspx?page=&id=965">this Idehen post</a>. Yahoo!&#39;s <a href="http://jeremy.zawodny.com/blog/archives/006687.html">Jeremy Zawodny</a> points out that the &#39;fingerprints&#39; of <a href="http://oakleafblog.blogspot.com/2005/11/adam-bosworth-learning-from-web-and.html">Adam Bosworth</a>, Google&#39;s VP of Engineering and the primary force behind the development of Microsoft Access, &#39;are all over GData.&#39; Click <a href="http://search.blogger.com/?as_q=bosworth&ie=UTF-8&ui=blg&amp;bl_url=oakleafblog.blogspot.com&x=50&y=10">here</a> to display a list of all OakLeaf posts that mention Adam Bosworth.<br /> <br />One application for the GData protocol is querying and updating the Google Base database independently of the Google Web client, as mentioned by Jeremy: &#39;It&#39;s not about building an easier onramp to Google Base. ... Well, it is. But, again, that&#39;s the small stuff.&#39; Click <a href="http://search.blogger.com/?as_q=%22google+base%22&ie=UTF-8&x=50&y=9&q=%22google+base%22+blogurl:oakleafblog.blogspot.com&filter=0&ui=blg&sa=N&start=0">here</a> for a list of posts about my experiences with Google Base. Watch for a future OakLeaf post on the subject as the GData APIs gain ground.<br /> <span style="font-family: Verdana;"></span> <br />  <span style="font-family: Verdana;"><strong>Open-Source and Free Embedded Database Contenders</strong>  </span> <br /> <span style="font-family: Verdana;"></span> <br /> <span style="font-family: Verdana;">Open-source and free embedded SQL databases are gaining importance as the number and types of mobile devices and OSs proliferate. Embedded databases usually consist of Java classes or Windows DLLs that are designed to minimize file size and memory consumption. Embedded databases avoid the installation hassles, heavy resource usage and maintenance cost associated with client/server RDBMSs that run as an operating system service.</span> <br /> <br /> <span style="font-family: Verdana;">Andrew Hudson&#39;s December 2005 &#39;<a href="http://www.theinquirer.net/?article=28201">Open Source databases rounded up and rodeoed</a>&#39; review for The Enquirer provides brief descriptions of one commercial and eight open source database purveyors/products: Sleepycat, MySQL, PostgreSQL, Ingres, InnoBase, Firebird, IBM Cloudscape (a.k.a, Derby), Genezzo, and Oracle. Oracle <a href="http://www.sleepycat.com/">Sleepycat</a>* isn&#39;t an SQL Database, Oracle <a href="http://www.innodb.com/index.php">InnoDB</a>* is an OEM database engine that&#39;s used by MySQL, and <a href="http://www.genezzo.com/">Genezzo</a> is a multi-user, multi-server distributed database engine written in Perl. These special-purpose databases are beyond the scope of this post.</span> <br /> <br />  <span style="font-family: Verdana;"><span style="font-size: 85%;">* Oracle <a href="http://www.oracle.com/sleepycat/index.html">purchased Sleepycat Software, Inc. in February 2006</a> and </span>   <a href="http://www.oracle.com/innodb/index.html"><span style="font-size: 85%;">purchased Innobase OY in October 2005</span>   </a><span style="font-size: 85%;">. The press release states: &#39;Oracle intends to continue developing the InnoDB technology and expand our commitment to open source software.&#39; </span>  </span> <br /> <span style="font-family: Verdana; font-size: 85%;"></span> <br /> <span style="font-family: Verdana;">   <a href="http://db.apache.org/derby/"><strong>Derby</strong>   </a> is an open-source release by the <a href="http://www.apache.org/">Apache Software Foundation</a> of the <a href="http://www.infoworld.com/article/04/08/03/HNcloudscape_1.html">Cloudscape Java-based database that IBM acquired</a> when it bought Informix in 2001. IBM offers a commercial release of Derby as <a href="http://www-128.ibm.com/developerworks/db2/library/techarticle/dm-0408cline/">IBM Cloudscape 10.1</a>. Derby is a Java class library that has a relatively light footprint (2 MB), which make it suitable for <a href="http://www-128.ibm.com/developerworks/db2/library/techarticle/dm-0503stumpf/">client/server synchronization</a> with the IBM DB2 Everyplace Sync Server in <a href="http://www-128.ibm.com/developerworks/library/wi-cloud/">mobile applications</a>. The IBM DB2 Everyplace Express Edition isn&#39;t open source or free*, so it doesn&#39;t qualify for this post. The same is true for the corresponding Sybase SQL Anywhere components.**</span> <br /> <br /> <br />  <p>   <span style="font-family: verdana; font-size: 85%;">* IBM DB2 Everyplace Express Edition with synchronization costs $379 per server (up to two processors) and $79 per user. DB2 Everyplace Database Edition (without DB2 synchronization) is $49 per user. (Prices are based on those when </span>   <a href="http://news.earthweb.com/wireless/article.php/3107101"><span style="font-family: verdana; font-size: 85%;">IBM announced version 8</span>   </a><span style="font-family: verdana; font-size: 85%;"> in November 2003.)</span>  </p>  <p>   <span style="font-family: verdana; font-size: 85%;">** Sybase&#39;s iAnywhere subsidiary calls SQL Anywhere &#39;the industry&#39;s leading mobile database.&#39; A Sybase SQL Anywhere Personal DB seat license with synchronization to SQL Anywhere Server is $119; the cost without synchronization wasn&#39;t available from the Sybase Web site. Sybase SQL Anywhere and IBM DB2 Everyplace perform similar replication functions.</span>  </p>  <p>   <span style="font-family: Verdana;">Sun&#39;s <a href="http://developers.sun.com/prodtech/javadb/"><strong>Java DB</strong></a>, another commercial version of Derby, comes with the <a href="http://www.sun.com/software/solaris/">Solaris Enterprise Edition</a>, which bundles Solaris 10, the Java Enterprise System, developer tools, desktop infrastructure and N1 management software. A recent Between the Lines blog entry by ZDNet&#39;s David Berlind waxes enthusiastic over the use of <a href="http://blogs.zdnet.com/BTL/?p=2298">Java DB embedded in a browser</a> to provide offline persistence. RedMonk analyst <a href="http://www.redmonk.com/jgovernor/archives/001151.html">James Governor</a> and <em>eWeek</em>&#39;s <a href="http://www.eweek.com/article2/0,1895,1902407,00.asp">Lisa Vaas</a> wrote about the use of Java DB as a local data store when <a href="http://www.sauria.com/blog/2005/12/13#1440">Tim Bray announced Sun&#39;s Derby derivative</a> and <a href="http://blogs.sun.com/roller/page/FrancoisOrsini?entry=derby_apachecon_demo">Francois Orsini</a> demonstrated Java DB embedded in the Firefox browser at the ApacheCon 2005 conference.</span>   <br />   <span style="font-family: Verdana;"></span>   <br />   <span style="font-family: Verdana;">    <a href="http://www.firebirdsql.org/"><strong>Firebird</strong>    </a> is derived from Borland&#39;s InterBase 6.0 code, the first commercial relational database management system (RDBMS) to be released as open source. Firebird has excellent support for SQL-92 and comes in three versions: Classic, SuperServer and Embedded for Windows, Linux, Solaris, HP-UX, FreeBSD and MacOS X. The embedded version has a 1.4-MB footprint. Release Candidate 1 for Firebird 2.0 became available on March 30, 2006 and is a major improvement over earlier versions. <a href="http://www.borland.com/us/products/interbase/index.html">Borland continues to promote InterBase</a>, now at version 7.5, as a small-footprint, embedded database with commercial Server and Client licenses.</span>   <br />   <span style="font-family: Verdana;"></span>   <br />   <span style="font-family: Verdana;">    <a href="http://www.sqlite.org/index.html"><strong>SQLite</strong>    </a> is a featherweight C library for an embedded database that implements most SQL-92 entry- and transitional-level requirements (some through the JDBC driver) and supports transactions within a tiny 250-KB code footprint. <a href="http://www.sqlite.org/cvstrac/wiki?p=SqliteWrappers">Wrappers</a> support a multitude of languages and operating systems, including Windows CE, SmartPhone, Windows Mobile, and Win32. SQLite&#39;s primary <a href="http://www.sqlite.org/omitted.html">SQL-92 limitations</a> are lack of nested transactions, inability to alter a table design once committed (other than with RENAME TABLE and ADD COLUMN operations), and foreign-key constraints. SQLite provides read-only views, triggers, and 256-bit encryption of database files. A downside is the the entire database file is <a href="http://weblogs.asp.net/jgalloway/archive/2006/04/12/442615.aspx">locked when while a transaction is in progress</a>. SQLite uses file access permissions in lieu of GRANT and REVOKE commands. Using SQLite involves no license; its code is entirely in the public domain.</span>  </p>  <p>   <span style="font-family: Verdana; font-size: 85%;">The Mozilla Foundation&#39;s <a href="http://wiki.mozilla.org/Mozilla2:Unified_Storage">Unified Storage wiki</a> says this about SQLite: &#39;SQLite will be the back end for the unified store [for Firefox]. Because it implements a SQL engine, we get querying &#39;for free&#39;, without having to invent our own query language or query execution system. Its code-size footprint is moderate (250k), but it will hopefully simplify much existing code so that the net code-size change should be smaller. It has exceptional performance, and supports concurrent access to the database. Finally, it is released into the public domain, meaning that we will have no licensing issues.&#39;</span>  </p>  <p>   <span style="font-family: verdana;">Vieka Technology, Inc.&#39;s <a href="http://vieka.com/esql.htm"><strong>eSQL 2.11</strong></a> is a port of SQLite to Windows Mobile (Pocket PC and Smartphone) and Win32, and includes development tools for Windows devices and PCs, as well as a .NET native data provider. A conventional ODBC driver also is available. eSQL for Windows (Win32) is free for personal and commercial use; eSQL for Windows Mobile requires a license for commercial (for-profit or business) use.</span>  </p>  <p>   <span style="font-family: verdana;">    <a href="http://hsqldb.org/"><strong>HSQLDB</strong>    </a> isn&#39;t on most reviewers&#39; radar, which is surprising because it&#39;s the default database for <a href="http://www.openoffice.org/">OpenOffice.org</a> (OOo) 2.0&#39;s <a href="http://www.openoffice.org/product/base.html">Base</a> suite member. HSQLDB 1.8.0.1 is an open-source (BSD license) Java dembedded database engine based on Thomas Mueller&#39;s original Hypersonic SQL Project. Using OOo&#39;s Base feature requires installing the Java 2.0 Runtime Engine (which is not open-source) or the presence of an alternative open-source engine, such as Kaffe. My prior posts about OOo Base and HSQLDB are <a href="http://oakleafblog.blogspot.com/2005/10/openoffice-base-20-vs-microsoft-access.html">here</a>, <a href="http://oakleafblog.blogspot.com/2005/10/openoffice-base-20-vs-microsoft-access_22.html">here</a> and <a href="http://oakleafblog.blogspot.com/2005/10/openoffice-20-base-matches-microsoft.html">here</a>.</span>  </p>  <p>   <span style="font-family: verdana;">The <a href="http://hsqldb.sourceforge.net/web/hsqlDocsFrame.html">HSQLDB 1.8.0 documentation</a> on SourceForge states the following regarding SQL-92 and later conformance:</span>  </p>  <span style="font-family: verdana;">   <blockquote>    <p>     <span style="font-family: verdana;">HSQLDB 1.8.0 supports the dialect of SQL defined by SQL standards 92, 99 and 2003. This means where a feature of the standard is supported, e.g. left outer join, the syntax is that specified by the standard text. Many features of SQL92 and 99 up to Advanced Level are supported and here is support for most of SQL 2003 Foundation and several optional features of this standard. However, certain features of the Standards are not supported so no claim is made for full support of any level of the standards. </span>    </p>   </blockquote>   <span style="font-family: verdana;"><span style="font-size: 85%;">Other less well-known embedded databases designed for or suited to mobile deployment are </span>    <a href="http://www.mimer.com/leftright.asp?secId=172"><span style="font-size: 85%;">Mimer SQL Mobile</span>    </a><span style="font-size: 85%;"> and </span>    <a href="http://www.vistadb.net/"><span style="font-size: 85%;">VistaDB 2.1</span>    </a><span style="font-size: 85%;">. Neither product is open-source and require paid licensing; VistaDB requires a small up-front payment by developers but offers royalty-free distribution.</span>   </span> <br /> <br /> <span style="font-family: Verdana;">Java DB, Firebird embedded, SQLite and eSQL 2.11 are contenders for lightweight PC and mobile device database projects that aren&#39;t Windows-only.</span> <br /> <br />   <strong>    <span style="font-family: verdana;">SQL Server 2005 Everywhere<br />    </span><span style="font-family: Verdana;"></span>   </strong> <br /> <span style="font-family: verdana;">If you&#39;re a Windows developer, SQL Server Mobile is the logical embedded database choice for mobile applications for Pocket PCs and Smartphones. Microsoft&#39;s April 19, 2006 press release delivered the news that SQL Server 2005 Mobile Editon (SQL Mobile or SSM) would gain a big brotherâSQL Server 2005 Everywhere Edition. </span> <br /> <span style="font-family: verdana;"></span> <br /> <span style="font-family: verdana;">Currently, the SSM client is licensed (at no charge) to run in production on devices with Windows CE 5.0, Windows Mobile 2003 for Pocket PC or Windows Mobile 5.0, or on PCs with Windows XP Tablet Edition only. SSM also is licensed for development purposes on PCs running Visual Studio 2005.</span>   <span style="font-family: verdana;"> Smart Device replication with SQL Server 2000 SP3 and later databases has been the most common application so far for SSM.<br /> <br />   </span><span style="font-family: verdana;">By the end of 2006, Microsoft will license SSE for use on <em>all</em> PCs running any Win32 version or the preceding device OSs. A version of SQL Server Management Studio Express (SSMSE)âupdated to support SSEâis expected to release by the end of the year. These features will qualify SSE as <em>the universal embedded database</em> for Windows client and smart-device applications. </span> <br /> <br /> <span style="font-family: verdana;">For more details on SSE, read <a href="http://weblogs.asp.net/jgalloway/archive/2006/04/11/442451.aspx">John Galloway&#39;s April 11, 2006 blog post</a> and my &#39;<a href="http://www.ftponline.com/special/sqlserver/rjennings-mobile/">SQL Server 2005 Mobile Goes Everywhere</a>&#39; article for the <a href="http://www.ftponline.com/special/sqlserver/">FTPOnline Special Report on SQL Server</a>.</span><span style="font-family: verdana;"></span>&quot;  <p>(Via <a href="http://oakleafblog.blogspot.com">OakLeaf Systems</a>.)</p>  </span> </blockquote> 
]]></content:encoded>
 </rss:item>
 <rss:item xmlns:rss="http://purl.org/rss/1.0/" rdf:about="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2006-04-28#965">
  <rss:title>My podcast conversation with Jon Udell </rss:title>
  <dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2006-04-28T14:43:12Z</dc:date>
  <dc:description xmlns:dc="http://purl.org/dc/elements/1.1/">Jon and I had a recent chat yesterday that is now available in Podcast form. &quot;In my fourth Friday podcast we hear from Kingsley Idehen, CEO of OpenLink Software. I wrote about OpenLink&#39;s universal database and app server, Virtuoso, back in 2002 and 2003. Earlier this month Virtuoso became the first mature SQL/XML hybrid to make the transition to open source. The latest incarnation of the product also adds SPARQL (a semantic web query language) to its repertoire. ...&quot; (Via Jon&#39;s Radio.) I would like to make an important clarification re. the GData Protocol and what is popularly dubbed as &quot;Adam Bosworth&#39;s fingerprints.&quot; I do not believe in a one solution (a simple one for the sake of simplicity) to a deceptively complex problem. Virtuoso supports Atom 1.0 (syndication only at the current time) and Atom 0.3 (syndication and publication which have been in place for years). BTW - the GData Protocol and Atom 1.0 publishing support will be delivered in both the Open Source and Commercial Edition updates to Virtuoso next week (very little work due to what&#39;s already in place). I make the clarification above to eliminate the possibility of assuming mutual exclusivity of my perspective/vison and Adam&#39;s (Jon also makes this important point when he speaks about our opinions being on either side of a spectrum/continuum). I simply want to broaden the scope of this discussion. I am a profound believer in the Semantic Web / Data Web vision, and I predict that we will be querying the Googlebase via SPARQL in the not to distant future (this doesn&#39;t mean that netizens will be forced to master SPARQL, absolutely not! But there will be conduit technologies that deal with matter). Side note: I actually last spoke with Adam at the NY Hilton in 2000 (the day I unveiled Virtuoso to the public for the first time, in person). We bumped into each other and I told him about Virtuoso (at the time the big emphasis was SQL to XML and the vocabulary we had chosen re. SQL extension...), and he told me about his departure from Microsoft and the commencement of his new venture (CrossGain prior to his stint at BEA), what struck me even more was his interest in Linux and Open Source (bearing in mind this was about 3 or so week after he departed Microsoft.) If you are encountering Virtuoso for the first time via this post or Jon&#39;s, please make time to read the product history article on the Virtuoso Wiki (which is one of many Virtuoso based applications that make up our soon to be released OpenLink DataSpace offering). That said, I better go listen to the podcast :-)</dc:description>
  <content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<p>Jon and I had a recent chat yesterday that is now available in <a href="http://weblog.infoworld.com/udell/2006/04/28.html#a1437">Podcast</a> form.</p>
<blockquote>
 <cite><p>&quot;In my <a href="http://weblog.infoworld.com/udell/gems/ju_idehen.mp3">fourth Friday podcast</a> we hear from Kingsley Idehen, CEO of <a href="http://openlinksw.com/">OpenLink Software</a>. I wrote about OpenLink&#39;s universal database and app server, Virtuoso, back in <a href="http://www.infoworld.com/article/02/04/12/020415plvirtuoso_1.html">2002</a> and <a href="http://www.infoworld.com/article/03/03/21/12virtuoso_1.html">2003</a>. Earlier this month Virtuoso became the first mature SQL/XML hybrid to make the <a href="http://www.openlinksw.com/blog/~kidehen/?id=951">transition to open source</a>. The latest incarnation of the product also adds SPARQL (a semantic web query language) to its repertoire.
 <b>...</b>&quot;</p>
<p>(Via <a href="http://weblog.infoworld.com/udell/">Jon&#39;s Radio</a>.)</p>
 </cite>
</blockquote>

I would like to make an important clarification re. the GData Protocol and what is popularly dubbed as &quot;<a href="http://jeremy.zawodny.com/blog/archives/006687.html">Adam Bosworth&#39;s fingerprints.</a>&quot; I do not believe in a one solution (a simple one for the sake of simplicity) to a deceptively complex problem. Virtuoso supports Atom 1.0 (syndication only at the current time) and Atom 0.3 (syndication and publication which have been in place for years). 

<blockquote>BTW - the GData Protocol and Atom 1.0 publishing support will be delivered in both the Open Source and Commercial Edition updates to Virtuoso next week (very little work due to what&#39;s already in place).</blockquote>
<p>I make the clarification above to eliminate the possibility of assuming mutual exclusivity of my perspective/vison and Adam&#39;s (Jon also makes this important point when he speaks about our opinions being on either side of a spectrum/continuum). I simply want to broaden the scope of this discussion. I am a profound believer in the Semantic Web / Data Web vision, and I predict that we will be querying the Googlebase via SPARQL in the not to distant future (this doesn&#39;t mean that netizens will be forced to master SPARQL, absolutely not! But there will be conduit technologies that deal with matter).</p>
<p>Side note: I actually last spoke with Adam at the NY Hilton in 2000 (the day I unveiled Virtuoso to the public for the first time, in person). We bumped into each other and I told him about Virtuoso (at the time the big emphasis was SQL to XML and the vocabulary we had chosen re. SQL extension...), and he told me about his departure from Microsoft and the commencement of his new venture (CrossGain prior to his stint at BEA), what struck me even more was his interest in Linux and Open Source (bearing in mind this was about 3 or so week after he departed Microsoft.)</p>
<p>If you are encountering Virtuoso for the first time via this post or Jon&#39;s, please make time to read the <a href="http://virtuoso.openlinksw.com/wiki/main/Main/VOSHistory/">product history</a> article on the <a href="http://virtuoso.openlinksw.com/wiki/main/Main/">Virtuoso Wiki</a> (which is one of many Virtuoso based applications that make up our soon to be released OpenLink DataSpace offering).</p>
<p>That said, I better go listen to the podcast :-)</p>]]></content:encoded>
 </rss:item>
 <rss:item xmlns:rss="http://purl.org/rss/1.0/" rdf:about="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2006-04-28#993">
  <rss:title>My podcast conversation with Jon Udell</rss:title>
  <dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2006-04-28T14:43:12Z</dc:date>
  <dc:description xmlns:dc="http://purl.org/dc/elements/1.1/">Jon and I had a recent chat yesterday that is now available in Podcast form. &quot;In my fourth Friday podcast we hear from Kingsley Idehen, CEO of OpenLink Software. I wrote about OpenLink&#39;s universal database and app server, Virtuoso, back in 2002 and 2003. Earlier this month Virtuoso became the first mature SQL/XML hybrid to make the transition to open source. The latest incarnation of the product also adds SPARQL (a semantic web query language) to its repertoire. ...&quot; (Via Jon&#39;s Radio.) I would like to make an important clarification re. the GData Protocol and what is popularly dubbed as &quot;Adam Bosworth&#39;s fingerprints.&quot; I do not believe in a one solution (a simple one for the sake of simplicity) to a deceptively complex problem. Virtuoso supports Atom 1.0 (syndication only at the current time) and Atom 0.3 (syndication and publication which have been in place for years). BTW - the GData Protocol and Atom 1.0 publishing support will be delivered in both the Open Source and Commercial Edition updates to Virtuoso next week (very little work due to what&#39;s already in place). I make the clarification above to eliminate the possibility of assuming mutual exclusivity of my perspective/vison and Adam&#39;s (Jon also makes this important point when he speaks about our opinions being on either side of a spectrum/continuum). I simply want to broaden the scope of this discussion. I am a profound believer in the Semantic Web / Data Web vision, and I predict that we will be querying the Googlebase via SPARQL in the not to distant future (this doesn&#39;t mean that netizens will be forced to master SPARQL, absolutely not! But there will be conduit technologies that deal with matter). Side note: I actually last spoke with Adam at the NY Hilton in 2000 (the day I unveiled Virtuoso to the public for the first time, in person). We bumped into each other and I told him about Virtuoso (at the time the big emphasis was SQL to XML and the vocabulary we had chosen re. SQL extension...), and he told me about his departure from Microsoft and the commencement of his new venture (CrossGain prior to his stint at BEA), what struck me even more was his interest in Linux and Open Source (bearing in mind this was about 3 or so week after he departed Microsoft.) If you are encountering Virtuoso for the first time via this post or Jon&#39;s, please make time to read the product history article on the Virtuoso Wiki (which is one of many Virtuoso based applications that make up our soon to be released OpenLink DataSpace offering). That said, I better go listen to the podcast :-)</dc:description>
  <content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[
 <p>Jon and I had a recent chat yesterday that is now available in <a href="http://weblog.infoworld.com/udell/2006/04/28.html#a1437">Podcast</a> form.</p> <blockquote>  <cite></cite> <p>&quot;In my <a href="http://weblog.infoworld.com/udell/gems/ju_idehen.mp3">fourth Friday podcast</a> we hear from Kingsley Idehen, CEO of <a href="http://openlinksw.com/">OpenLink Software</a>. I wrote about OpenLink&#39;s universal database and app server, Virtuoso, back in <a href="http://www.infoworld.com/article/02/04/12/020415plvirtuoso_1.html">2002</a> and <a href="http://www.infoworld.com/article/03/03/21/12virtuoso_1.html">2003</a>. Earlier this month Virtuoso became the first mature SQL/XML hybrid to make the <a href="http://www.openlinksw.com/blog/%7Ekidehen/?id=951">transition to open source</a>. The latest incarnation of the product also adds SPARQL (a semantic web query language) to its repertoire.  <b>...</b>&quot;</p> <p>(Via <a href="http://weblog.infoworld.com/udell/">Jon&#39;s Radio</a>.)</p>   </blockquote>  I would like to make an important clarification re. the GData Protocol and what is popularly dubbed as &quot;<a href="http://jeremy.zawodny.com/blog/archives/006687.html">Adam Bosworth&#39;s fingerprints.</a>&quot; I do not believe in a one solution (a simple one for the sake of simplicity) to a deceptively complex problem. Virtuoso supports Atom 1.0 (syndication only at the current time) and Atom 0.3 (syndication and publication which have been in place for years).   <blockquote>BTW - the GData Protocol and Atom 1.0 publishing support will be delivered in both the Open Source and Commercial Edition updates to Virtuoso next week (very little work due to what&#39;s already in place).</blockquote> <p>I make the clarification above to eliminate the possibility of assuming mutual exclusivity of my perspective/vison and Adam&#39;s (Jon also makes this important point when he speaks about our opinions being on either side of a spectrum/continuum). I simply want to broaden the scope of this discussion. I am a profound believer in the Semantic Web / Data Web vision, and I predict that we will be querying the Googlebase via SPARQL in the not to distant future (this doesn&#39;t mean that netizens will be forced to master SPARQL, absolutely not! But there will be conduit technologies that deal with matter).</p> <p>Side note: I actually last spoke with Adam at the NY Hilton in 2000 (the day I unveiled Virtuoso to the public for the first time, in person). We bumped into each other and I told him about Virtuoso (at the time the big emphasis was SQL to XML and the vocabulary we had chosen re. SQL extension...), and he told me about his departure from Microsoft and the commencement of his new venture (CrossGain prior to his stint at BEA), what struck me even more was his interest in Linux and Open Source (bearing in mind this was about 3 or so week after he departed Microsoft.)</p> <p>If you are encountering Virtuoso for the first time via this post or Jon&#39;s, please make time to read the <a href="http://virtuoso.openlinksw.com/wiki/main/Main/VOSHistory">product history</a> article on the <a href="http://virtuoso.openlinksw.com/wiki/main/">Virtuoso Wiki</a> (which is one of many Virtuoso based applications that make up our soon to be released OpenLink DataSpace offering).</p> <p>That said, I better go listen to the podcast :-)</p> 
]]></content:encoded>
 </rss:item>
 <rss:item xmlns:rss="http://purl.org/rss/1.0/" rdf:about="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2006-04-11#951">
  <rss:title>Virtuoso is Officially Open Source!</rss:title>
  <dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2006-04-11T18:01:44Z</dc:date>
  <dc:description xmlns:dc="http://purl.org/dc/elements/1.1/">I am pleased to unveil (officially) the fact that Virtuoso is now available in Open Source form. What Is Virtuoso? A powerful next generation server product that implements otherwise distinct server functionality within a single server product. Think of Virtuoso as the server software analog of a dual core processor where each core represents a traditional server functionality realm. Where did it come from? The Virtuoso History page tells the whole story. What Functionality Does It Provide? The following: 1. Object-Relational DBMS Engine (ORDBMS like PostgreSQL and DBMS engine like MySQL) 2. XML Data Management (with support for XQuery, XPath, XSLT, and XML Schema) 3. RDF Triple Store (or Database) that supports SPARQL (Query Language, Transport Protocol, and XML Results Serialization format) 4. Service Oriented Architecture (it combines a BPEL Engine with an ESB) 5. Web Application Server (supports HTTP/WebDAV) 6. NNTP compliant Discussion Server And more. (see: Virtuoso Web Site) 90% of the aforementioned functionality has been available in Virtuoso since 2000 with the RDF Triple Store being the only 2006 item. What Platforms are Supported The Virtuoso build scripts have been successfully tested on Mac OS X (Universal Binary Target), Linux, FreeBSD, and Solaris (AIX, HP-UX, and True64 UNIX will follow soon). A Windows Visual Studio project file is also in the works (ETA some time this week). Why Open Source? Simple, there is no value in a product of this magnitude remaining the &quot;best kept secret&quot;. That status works well for our competitors, but absolutely works against the legions of new generation developers, systems integrators, and knowledge workers that need to be aware of what is actually achievable today with the right server architecture. What Open Source License is it under? GPL version 2. What&#39;s the business model? Dual licensing. The Open Source version of Virtuoso includes all of the functionality listed above. While the Virtual Database (distributed heterogeneous join engine) and Replication Engine (across heterogeneous data sources) functionality will only be available in the commercial version. Where is the Project Hosted? On SourceForge. Is there a product Blog? Of course! Up until this point, the Virtuoso Product Blog has been a covert live demonstration of some aspects of Virtuoso (Content Management). My Personal Blog and the Virtuoso Product Blog are actual Virtuoso instances, and have been so since I started blogging in 2003. Is There a product Wiki? Sure! The Virtuoso Product Wiki is also an instance of Virtuoso demonstrating another aspect of the Content Management prowess of Virtuoso. What About Online Documentation? Yep! Virtuoso Online Documentation is hosted via yet another Virtuoso instance. This particular instance also attempts to demonstrate Free Text search combined with the ability to repurpose well formed content in a myriad of forms (Atom, RSS, RDF, OPML, and OCS). What about Tutorials and Demos? The Virtuoso Online Tutorial Site has operated as a live demonstration and tutorial portal for a numbers of years. During the same timeframe (circa. 2001) we also assembled a few Screencast style demos (their look feel certainly show their age; updates are in the works). BTW - We have also updated the Virtuoso FAQ and also released a number of missing Virtuoso White Papers (amongst many long overdue action items).</dc:description>
  <content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[
<p>I am pleased to unveil (officially) the fact that <a href="http://www.prnewswire.com/cgi-bin/stories.pl?ACCT=104&STORY=/www/story/04-11-2006/0004338324&EDATE=">Virtuoso is now available in Open Source form</a>.</p> <p></p> <h4>What Is Virtuoso?</h4> <p>A powerful next generation server product that implements otherwise distinct server functionality within a single server product. Think of Virtuoso as the server software analog of a dual core processor where each core represents a traditional server functionality realm.</p> <p></p> <h4>Where did it come from?</h4> <p>The <a href="http://virtuoso.openlinksw.com/wiki/main/Main/VOSHistory">Virtuoso History page</a> tells the whole story.</p> <p></p> <h4>What Functionality Does It Provide?</h4>  The following: <ul> 1. Object-Relational DBMS Engine (ORDBMS like PostgreSQL and DBMS engine like MySQL) </ul> <ul> 2. XML Data Management (with support for XQuery, XPath, XSLT, and XML Schema) </ul> <ul> 3. RDF Triple Store (or Database) that supports SPARQL (Query Language, Transport Protocol, and XML Results Serialization format) </ul> <ul> 4. Service Oriented Architecture (it combines a BPEL Engine with an ESB) </ul> <ul> 5. Web Application Server (supports HTTP/WebDAV) </ul> <ul> 6. NNTP compliant Discussion Server </ul>  And more. (see: <a href="http://virtuoso.openlinksw.com">Virtuoso Web Site</a>) <p> 90% of the aforementioned functionality has been available in Virtuoso since 2000 with the RDF Triple Store being the only 2006 item.</p> <p></p> <h4>What Platforms are Supported</h4> <p> The Virtuoso build scripts have been successfully tested on Mac OS X (Universal Binary Target), Linux, FreeBSD, and Solaris (AIX, HP-UX, and True64 UNIX will follow soon). A Windows Visual Studio project file is also in the works (ETA some time this week).</p> <p></p> <h4>Why Open Source?</h4> <p>Simple, there is no value in a product of this magnitude remaining the &quot;best kept secret&quot;. That status works well for our competitors, but absolutely works against the legions of new generation developers, systems integrators, and knowledge workers that need to be aware of what is actually achievable today with the right server architecture.</p> <p></p> <h4>What Open Source License is it under?</h4> <p>GPL version 2.</p> <p></p> <h4>What&#39;s the business model?</h4> <p>Dual licensing.</p> <p>The Open Source version of Virtuoso includes all of the functionality listed above. While the Virtual Database (distributed heterogeneous join engine) and Replication Engine (across heterogeneous data sources) functionality will only be available in the commercial version. </p> <p></p> <h4>Where is the Project Hosted?</h4> <p>On <a href="http://sourceforge.net/projects/virtuoso">SourceForge.</a> </p> <p></p> <h4>Is there a product Blog?</h4> <p>Of course! </p> <p>Up until this point, the <a href="http://virtuoso.openlinksw.com/blog/">Virtuoso Product Blog</a> has been a covert live demonstration of some aspects of Virtuoso (Content Management). My Personal Blog and the Virtuoso Product Blog are actual Virtuoso instances, and have been so since I started blogging in 2003.</p> <p>Is There a product Wiki?</p> <p>Sure! <a href="http://virtuoso.openlinksw.com/wiki/main/">The Virtuoso Product Wiki</a> is also an instance of Virtuoso demonstrating another aspect of the Content Management prowess of Virtuoso.</p> <p></p> <h4>What About Online Documentation?</h4> <p>Yep! <a href="http://docs.openlinksw.com/virtuoso/">Virtuoso Online Documentation</a> is hosted via yet another Virtuoso instance. This particular instance also attempts to demonstrate Free Text search combined with the ability to repurpose well formed content in a myriad of forms (Atom, RSS, RDF, OPML, and OCS).</p> <p></p> <h4>What about Tutorials and Demos?</h4> <p>The <a href="http://demo.openlinksw.com/tutorial/">Virtuoso Online Tutorial</a> Site has operated as a live demonstration and tutorial portal for a numbers of years. During the same timeframe (circa. 2001) we also assembled a few Screencast style demos (their look feel certainly show their age; updates are in the works).</p> <p>BTW - We have also updated the <a href="http://virtuoso.openlinksw.com/FAQ/">Virtuoso FAQ</a> and also released a number of missing <a href="http://virtuoso.openlinksw.com/Whitepapers/">Virtuoso White Papers</a> (amongst many long overdue action items).</p>
]]></content:encoded>
 </rss:item>
 <rss:item xmlns:rss="http://purl.org/rss/1.0/" rdf:about="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2006-03-14#939">
  <rss:title>New XTech web site, and why we don&#39;t sell presentation space</rss:title>
  <dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2006-03-14T21:24:26Z</dc:date>
  <dc:description xmlns:dc="http://purl.org/dc/elements/1.1/">New XTech web site, and why we don&#39;t sell presentation space: &quot; My too-long absence from writing much here can be ascribed to two, differently pleasant, activities. First, a fantastic vacation in Cuba, and second, the redesign and launch of the XTech web site. Of the first, come to my place for dinner and I&#39;ll bore you at length about how amazing it was. Of the second, I&#39;d like to bore you right now! Thanks to Ruby on Rails and a few late nights, the XTech site now has these new features: Full conference schedule (apart from 6 Mozilla talks I&#39;m still nailing down) A blog. With go-faster Atom 1.0 stripes and everything! Details on the newly-added Ajax Developers&#39; Day. A few more details on the Ajax Developers&#39; Day. As I mentioned before, when putting together the schedule we felt there was a lot of excellent content still missed out (I&#39;m still feeling guilty at having rejected proposals from many good friends and excellent speakers). So, we put together an extra day at the beginning of the conference where we could go further into detail on Ajax technologies. This day, featuring speakers such as Simon Willison from Yahoo!, XML expert Kurt Cagle and OpenLaszlo&#39;s Max Carlson, will allow those working on Ajax projects--either deployment or toolkits--to meet, discuss best practice and move forward on new ideas. Although it&#39;s a day-long event, we didn&#39;t want to make the price tag as high as a full-day tutorial, so you can register for the cost of a half-day tutorial. A few implementation details If that all sounded a little like advertising, here are some technical details worth sharing. The site&#39;s CMS is built on Ruby on Rails. Development was done on Linux, with the help of WINE to check out the view from Internet Explorer. The newsletter is managed by the absurdly wonderful CampaignMonitor. This conference not for sale Before I went on vacation, there was some debate in various quarters about paid-for plenary and keynote slots in conferences. Though I hope it is obvious, I wanted to state where I, and thus the XTech conference, stand on this issue. It has always been my policy to maintain a strict separation between the commercial and editorial aspects of XTech. Although each year there&#39;s always a company who thinks they can buy a speaking slot, I never let this happen. The content of the conference is formed by editorial selection by the programme committee, who take the scores from the peer review panel as their primary guide. Aside from what I hope shows in the excellent quality of the talks and generally interesting keynotes (yes, we get it wrong occasionally!), there are two effects on the conference. Sponsors are that much more respected. When a sponsor respects the delegates&#39; time and intelligence, but still attends, you know they&#39;re serious about engagement with attendees. A higher portion of the conference cost is in the registration fees than for some other conferences. We&#39;re still trying to keep the costs as low as we can, but we&#39;re not prepared to compromise the quality of the schedule by letting vendors buy talk time. I hope this explains a little of my position. As a stance, it often creates more issues for me than it solves, but I believe it preserves XTech&#39;s reputation as a conference where you can hear some of the best no-fluff presentations on web technology.&quot; (Via Edd Dumbill&#39;s Weblog: Behind the Times.)</dc:description>
  <content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<p>
<a href="http://times.usefulinc.com/2006/03/14-xtech">New XTech web site, and why we don&#39;t sell presentation space</a>: &quot;</p>
<p>My too-long absence from writing much here can be ascribed to two, differently pleasant, activities. First, a fantastic vacation in Cuba, and second, the redesign and launch of the <a href="http://xtech06.usefulinc.com/">XTech web site</a>.</p>
<p>Of the first, come to my place for dinner and I&#39;ll bore you at length about how amazing it was. Of the second, I&#39;d like to bore you right now!</p>
<p>Thanks to Ruby on Rails and a few late nights, the XTech site now has these new features:</p>
<ul>
<li>
  <a href="http://xtech06.usefulinc.com/schedule">Full conference schedule</a> (apart from 6 Mozilla talks I&#39;m still nailing down)</li>
<li>
  <a href="http://xtech06.usefulinc.com/">A blog</a>. With go-faster Atom 1.0 stripes and everything!</li>
<li>Details on the newly-added <a href="http://xtech06.usefulinc.com/content/ajax">Ajax Developers&#39; Day</a>.</li>
</ul>
<p>A few more details on the Ajax Developers&#39; Day. As I mentioned before, when putting together the schedule we felt there was a lot of excellent content still missed out (I&#39;m still feeling guilty at having rejected proposals from many good friends and excellent speakers). So, we put together an extra day at the beginning of the conference where we could go further into detail on Ajax technologies.</p>
<p>This day, featuring speakers such as Simon Willison from Yahoo!, XML expert Kurt Cagle and OpenLaszlo&#39;s Max Carlson, will allow those working on Ajax projects--either deployment or toolkits--to meet, discuss best practice and move forward on new ideas. Although it&#39;s a day-long event, we didn&#39;t want to make the price tag as high as a full-day tutorial, so you can <a href="http://xtech06.usefulinc.com/content/registration">register</a> for the cost of a half-day tutorial.</p>
<h4>A few implementation details</h4>
<p>If that all sounded a little like advertising, here are some technical details worth sharing. The site&#39;s CMS is built on Ruby on Rails. Development was done on Linux, with the help of WINE to check out the view from Internet Explorer. The <a href="http://xtech06.usefulinc.com/public/newsletter">newsletter</a> is managed by the absurdly wonderful <a href="http://www.campaignmonitor.com/">CampaignMonitor</a>.</p>
<h4>This conference not for sale</h4>
<p>Before I went on vacation, there was some debate in various quarters about paid-for plenary and keynote slots in conferences. Though I hope it is obvious, I wanted to state where I, and thus the XTech conference, stand on this issue.</p>
<p>It has always been my policy to maintain a strict separation between the commercial and editorial aspects of XTech. Although each year there&#39;s always a company who thinks they can buy a speaking slot, I never let this happen. The content of the conference is formed by editorial selection by the programme committee, who take the scores from the peer review panel as their primary guide.</p>
<p>Aside from what I hope shows in the excellent quality of the talks and generally interesting keynotes (yes, we get it wrong occasionally!), there are two effects on the conference.</p>
<ul>
 <li>Sponsors are that much more respected. When a sponsor respects the delegates&#39; time and intelligence, but still attends, you know they&#39;re serious about engagement with attendees.<br />
 </li>
<li>A higher portion of the conference cost is in the registration fees than for some other conferences. We&#39;re still trying to keep the costs as low as we can, but we&#39;re not prepared to compromise the quality of the schedule by letting vendors buy talk time. </li>
</ul>I hope this explains a little of my position. As a stance, it often creates more issues for me than it solves, but I believe it preserves XTech&#39;s reputation as a conference where you can hear some of the best no-fluff presentations on web technology.<br />&quot;

<p>(Via <a href="http://times.usefulinc.com/">Edd Dumbill&#39;s Weblog: Behind the Times</a>.)</p>]]></content:encoded>
 </rss:item>
 <rss:item xmlns:rss="http://purl.org/rss/1.0/" rdf:about="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2006-02-22#936">
  <rss:title>Contd: Windows/Linux/OSX Co-existence on MacIntels</rss:title>
  <dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2006-02-22T19:50:05Z</dc:date>
  <dc:description xmlns:dc="http://purl.org/dc/elements/1.1/">More notes and findings from the Mac OS X Internals Book site.</dc:description>
  <content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[More notes and findings from the <a href="http://www.osxbook.com/book/bonus/misc/linux/">Mac OS X Internals Book site</a>.]]></content:encoded>
 </rss:item>
 <rss:item xmlns:rss="http://purl.org/rss/1.0/" rdf:about="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2006-01-18#924">
  <rss:title>Windows/Linux on MacIntel Race is on!</rss:title>
  <dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2006-01-18T22:54:57Z</dc:date>
  <dc:description xmlns:dc="http://purl.org/dc/elements/1.1/">As indicated in an earlier post, the real sweet spot for the recently announced MacIntels is going to be delivery of Mac OS X (which covers BSD), Linux, Solaris, and Windows running &quot;side by side&quot; nirvana (no dual booting). OpenOSX is first off the mark (at least publicly) from the emulator camp, but there many others to come! Anyway, I need to go test this for myself before I comment any further (I hate speculating without hands on experience).</dc:description>
  <content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[
As indicated in an <a href="http://www.openlinksw.com/blog/%7Ekidehen/index.vspx?page=&id=922">earlier post</a>, the real sweet spot for the recently announced MacIntels is going to be delivery of Mac OS X (which covers BSD), Linux, Solaris, and Windows running &quot;side by side&quot; nirvana (no dual booting).   <a href="http://www.openosx.com/wintel/index.html">OpenOSX</a> is first off the mark (at least publicly) from the emulator camp, but there many others to come! Anyway, I need to go test this for myself before I comment any further (I hate speculating without hands on experience). 
]]></content:encoded>
 </rss:item>
 <rss:item xmlns:rss="http://purl.org/rss/1.0/" rdf:about="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2006-01-11#922">
  <rss:title>As We Get Closer to Mac/Linux/Windows/Solaris MacIntels :-)</rss:title>
  <dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2006-01-11T22:37:35Z</dc:date>
  <dc:description xmlns:dc="http://purl.org/dc/elements/1.1/">Quick note to self and others interested in this inevitable nirvana: The new MacBook Pro&#39;s from Apple include support for Intel&#39;s EFI Bios.(Spotter: Digg) . Related Commentary: The emerging view is that EFI is a subtle mechanism for locking out Windows (since it doesn&#39;t support EFI in its x86 versions. And when it does, it only applies to the IA64 variants). Well, Linux handles EFI, and I assume that VMWare and others more than likely grok this already. Thus, we can hope that OS Virtualization players are getting revved up to provide even clearer justification for their existence by opening the gates to this Nirvana!</dc:description>
  <content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<p>Quick note to self and others interested in this inevitable nirvana: The new <a href="http://www.apple.com/macbookpro/">MacBook Pro</a>&#39;s from <a href="http://www.apple.com">Apple</a> include support for <a href="http://www.intel.com">Intel</a>&#39;s <a href="http://www.intel.com/technology/efi/">EFI Bios</a>.</p><p>(Spotter: <a href="http://digg.com/apple">Digg</a>) .</p>

<p>Related Commentary: The emerging view is that EFI is a subtle mechanism for locking out Windows (since it doesn&#39;t support EFI in its x86 versions. And when it does, it only applies to the IA64 variants). Well, Linux handles EFI, and I assume that VMWare and others more than likely grok this already. Thus, we can hope that OS Virtualization players are getting revved up to provide even clearer justification for their existence by opening the gates to this Nirvana!</p>
]]></content:encoded>
 </rss:item>
 <rss:item xmlns:rss="http://purl.org/rss/1.0/" rdf:about="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2005-11-16#904">
  <rss:title>Saving the Net from the pipeholders</rss:title>
  <dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2005-11-16T18:23:13Z</dc:date>
  <dc:description xmlns:dc="http://purl.org/dc/elements/1.1/">An interesting post that I have place verbatim for the following reasons: 1. Its Importance (generally speaking)2. Lot&#39;s of Link Love (A-List Blogger Style see: LinkBlog and Summary to see what My Blog does with these links)3. Time-to-show on Memeorandum (how, when, and if at all, are results that are of personal interest)Anyway, read the post from Doc Searls titled: Saving the Net from the pipeholders&quot;I&#39;ve spent much of the last two weeks writing an essay that just went up at Linux Journal: Saving the Net: How to Keep the Carriers from Flushing the Net Down the Tubes. It&#39;s probably the longest post I&#39;ve ever put up on the Web. It&#39;s certainly the most important. And not just to me.I started writing it after a recent surprise visit by David Isenberg to Santa Barbara. He&#39;s the one who got me â and, I hope, us â going.I finished writing it yesterday after David Berlind published threeexcellentpieces, which I highly recommend reading, and acting upon.For guidance during the rest of this thing (whether they knew it or not), I also want to thank David Weinberger, Dave Winer, Steve Gillmor, Kevin Werbach, Cory Doctorow, Don Marti, Richard M. Stallman, Eric S. Raymond, Susan Crawford, Larry Lessig, John Palfrey, Chris Nolan, Jeff Jarvis, Craig Burton, Andrew Sullivan, Paul Kunz, Dean Landsman, Matt Welch, Sheila Lennon, George Lakoff, Om Malik, Phil Hughes, J.D. Lasica, Virginia Postrel, Chris Anderson, Esther Dyson, Jim Thompson, Micah Sifry, John Perry Barlow, The EFF, the Berkman Center, the Personal Democracy Forum and others I&#39;m overlooking but will fill in later when I have the time.Although it&#39;s kinda huge, Saving the Net wasn&#39;t written as a Finished Work, but rather as a conversation starter â a way to change a rock we&#39;re pushing uphill to a snowball we&#39;re rolling downhill.Larry Lessig started rolling it at OSCON in 2002, and in various other ways before that, and the whole thing has been too damn sisyphean for too damn long. Time to change that.There&#39;s a thesis involved: that the Net is in danger of becoming what Kevin Werbachcalls&#39;a private toiled garden for the phone companies&#39;, but that the real enemy is in how we understand the Net itself. We have choices there, and those choices may mean life or death for the Net as most of us have known it â and taken it for granted â for the last decade or more.A couple days ago I spoke to a group of about thirty local citizens here in Santa Barbara County, gathered in the County supervisors&#39; conference room to discuss forming a broadband task force. Early on, I asked people what the Net was. The answers were varied, but had one thing in common: it was a place, and not just fiber and copper.&quot;</dc:description>
  <content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<p>An interesting post that I have place verbatim for the following reasons:
</p><ul>1. Its Importance (generally speaking)</ul><ul>2. Lot&#39;s of Link Love (A-List Blogger Style see: <a href="http://www.openlinksw.com/blog/~kidehen/index.vspx?page=linkblog">LinkBlog</a> and <a href="http://www.openlinksw.com/blog/~kidehen/index.vspx?page=summary">Summary</a> to see what <a href="http://www.openlinksw.com/blog/~kidehen">My Blog</a> does with these links)</ul><ul>3. Time-to-show on <a href="http://memeorandum.com">Memeorandum</a> (how, when, and if at all, are results that are of personal interest)</ul><p>Anyway, read the post from <a href="http://doc.weblogs.com/">Doc Searls</a> titled: <a href="http://doc.weblogs.com/2005/11/16#savingTheNetFromThePipeholders">Saving the Net from the pipeholders</a></p><p>&quot;I&#39;ve spent much of the last two weeks writing an essay that just went up at <a href="http://linuxjournal.com">Linux Journal</a>: <a href="http://www.linuxjournal.com/article/8673">Saving the Net: How to Keep the Carriers from Flushing the Net Down the Tubes</a>. It&#39;s probably the longest post I&#39;ve ever put up on the Web. It&#39;s certainly the most important. And not just to me.</p><p>I started writing it after a recent surprise visit by <a href="http://www.isen.com/blog/">David Isenberg</a> to Santa Barbara. He&#39;s the one who got me â and, I hope, us â going.</p><p>I finished writing it yesterday after <a href="http://blogs.zdnet.com/BTL/">David Berlind</a> published <a href="http://blogs.zdnet.com/BTL/?p=2160">three</a><a href="http://blogs.zdnet.com/BTL/?p=2161">excellent</a><a href="http://blogs.zdnet.com/BTL/?p=2157">pieces</a>, which I highly recommend reading, and acting upon.</p><p>For guidance during the rest of this thing (whether they knew it or not), I also want to thank <a href="http://www.hyperorg.com/blogger/">David Weinberger</a>, <a href="http://scripting.com/">Dave Winer</a>, <a href="http://blogs.zdnet.com/Gillmor/">Steve Gillmor</a>, <a href="http://werblog.com/">Kevin Werbach</a>, <a href="http://craphound.com/">Cory Doctorow</a>, <a href="http://zgp.org/~dmarti/">Don Marti</a>, <a href="http://www.stallman.org/">Richard M. Stallman</a>, <a href="http://esr.ibiblio.org/">Eric S. Raymond</a>, <a href="http://scrawford.blogware.com/blog">Susan Crawford</a>, <a href="http://lessig.org/blog/">Larry Lessig</a>, <a href="http://blogs.law.harvard.edu/palfrey/">John Palfrey</a>, <a href="http://www.spot-on.com/nolan/">Chris Nolan</a>, <a href="http://www.buzzmachine.com/">Jeff Jarvis</a>, <a href="http://www.craigburton.com/">Craig Burton</a>,<a href="http://www.andrewsullivan.com/">  Andrew Sullivan</a>, <a href="http://arstechnica.com/news.ars/post/20011210-2489.html">Paul Kunz</a>, <a href="http://blog.deanland.com/">Dean Landsman</a>, <a href="http://www.mattwelch.com/warblog.html">Matt Welch</a>, <a href="http://www.projo.com/shenews">Sheila Lennon</a>, <a href="http://www.georgelakoff.com/">George Lakoff</a>, <a href="http://gigaom.com/">Om Malik</a>, <a href="http://www.ssc.com/xstatic/corporate/staff/phil.html">Phil Hughes</a>, <a href="http://www.newmediamusings.com/">J.D. Lasica</a>, <a href="http://www.dynamist.com/weblog/">Virginia Postrel</a>, <a href="http://longtail.typepad.com/the_long_tail/">Chris Anderson</a>, <a href="http://www.release1-0.com/esther/">Esther Dyson</a>, <a href="http://www.smallworks.com/">Jim Thompson</a>, <a href="http://micah.sifry.com/">Micah Sifry</a>, <a href="http://blog.barlowfriendz.net/">John Perry Barlow</a>, <a href="http://www.eff.org/">The EFF</a>, <a href="http://cyber.law.harvard.edu">the Berkman Center</a>, the <a href="http://www.personaldemocracy.com/">Personal Democracy Forum</a> and others I&#39;m overlooking but will fill in later when I have the time.</p><p>Although it&#39;s kinda huge, <a href="http://www.linuxjournal.com/article/8673">Saving the Net</a> wasn&#39;t written as a Finished Work, but rather as a conversation starter â a way to change a rock we&#39;re pushing uphill to a <a href="http://doc.weblogs.com/2005/03/28#betOnTheSnowball">snowball</a> we&#39;re rolling downhill.</p><p><a href="http://randomfoo.net/oscon/2002/lessig/">Larry Lessig started rolling</a> it at OSCON in 2002, and in various other ways before that, and the whole thing has been too damn <a href="http://en.wikipedia.org/wiki/Sisyphus">sisyphean</a> for too damn long. Time to change that.</p><p>There&#39;s a thesis involved: that the Net is in danger of becoming what <a href="http://werblog.com/">Kevin Werbach</a><a href="http://werbach.com/blog/archives/2005/11/not_the_interne.html">calls</a>&#39;a private toiled garden for the phone companies&#39;, but that the real enemy is in how we understand the Net itself. We have choices there, and those choices may mean life or death for the Net as most of us have known it â and taken it for granted â for the last decade or more.</p><p>A couple days ago I spoke to a group of about thirty local citizens here in Santa Barbara County, gathered in the County supervisors&#39; conference room to discuss forming a broadband task force. Early on, I asked people what the Net was. The answers were varied, but had one thing in common: it was a <i>place</i>, and not just fiber and copper.&quot; </p>]]></content:encoded>
 </rss:item>
 <rss:item xmlns:rss="http://purl.org/rss/1.0/" rdf:about="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2005-10-26#882">
  <rss:title>Breaking the Web Wide Open! </rss:title>
  <dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2005-10-26T19:28:47Z</dc:date>
  <dc:description xmlns:dc="http://purl.org/dc/elements/1.1/">Marc Canter&#39;s Breaking the Web Wide Open! article is something I found pretty late (by my normal discovery standards). This was partly due to the pre- and post- Web 2.0 event noise levels that have dumped the description of an important industry inflection into the &quot;Bozo Bin&quot; of many. Personally, I think we shouldn&#39;t confuse the Web 2.0 traditional-pitch-fest conference with an attempt to identify an important industry inflection). Anyway, Marc&#39;s article is a very refreshing read because it provides a really good insight into the general landscape of a rapidly evolving Web alongside genuine appreciation of our broader timeless pursuit of &quot;Openness&quot;. To really help this document provide additional value have scrapped the content of the original post and dumped it below so that we can appreciate the value of the links embedded within the article (note: thanks to Virtuoso I only had to paste the content into my blog, the extraction to my Linkblog and Blog Summary Pages are simply features of my Virtuoso based Blog Engine):Breaking the Web Wide Open! (complete story)Even the web giants like AOL, Google, MSN, and Yahoo need to observe these open standards, or they&#39;ll risk becoming the &quot;walled gardens&quot; of the new web and be coolio no more.Marc Canter [Broadband Mechanics, Inc.] | POSTED: 09.26.05 @12:00Editorial Note: Several months ago, AlwaysOn got a personal invitation from Yahoo founder Jerry Yang &quot;to see and give us feedback on our new social media product, y!360.&quot; We were happy to oblige and dutifully showed up, joining a conference room full of hard-core bloggers and new, new media types. The geeks gave Yahoo 360 an overwhelming thumbs down, with comments like, &quot;So the only services I can use within this new network are Yahoo services? What if I don&#39;t use Yahoo IM?&quot; In essence, the Yahoo team was booed for being &quot;closed web,&quot; and we heartily agreed. With Yahoo 360, Yahoo continues building its own &quot;walled garden&quot; to control its 135 million customersÂan accusation also hurled at AOL in the early 1990s, before AOL migrated its private network service onto the web. As theÂ  Economist recently noted, &quot;Yahoo, in short, has old media plans for the new-media era.&quot;The irony to our view here is, of course, that today&#39;s AO Network is also a &quot;closed web.&quot; In the end, Mr. Yang&#39;s thoughtful invitation and our ensuing disappointment in his new service led to the assignment of this article. It also confirmed our existing plan to completely revamp the AO Network around open standards. To tie it all together, we recruited the chief architect of our new site, the notorious Marc Canter, to pen this piece. We look forward to our reader feedback.Breaking the Web Wide Open!By Marc CanterFor decades, &quot;walled gardens&quot; of proprietary standards and content have been the strategy of dominant players in mainframe computer software, wireless telecommunications services, and the World Wide WebÂit was their successful lock-in strategy of keeping their customers theirs. But like it or not, those walls are tumbling down. Open web standards are being adopted so widely, with such value and impact, that the web giantsÂAmazon, AOL, eBay, Google, Microsoft, and YahooÂare facing the difficult decision of opening up to what they don&#39;t control.The online world is evolving into a new open web (sometimes called the Web 2.0), which is all about being personalized and customized for each user. Not only open source software, but open standardsÂ are becoming an essential component. Many of the web giants have been using open source software for years. Most of them use at least parts of the LAMP (Linux, Apache, MySQL, Perl/Python/PHP) stack, even if they aren&#39;t well-known for giving back to the open source community. For these incumbents that grew big on proprietary web services, the methods, practices, and applications of open source software development are difficult to fully adopt. And the next open source movementsÂwhich will be as much about open standards as about codeÂwill be a lot harder for the incumbents to exploit.While the incumbents use cheap open source software to run their back-ends systems, their business models largely depend on proprietary software and algorithms. But our view a new slew of open software, open protocols, and open standards will confront the incumbents with the classic Innovator&#39;s Dilemma.Â  Should they adopt these tools and standards, painfully cannibalizing their existing revenue for a new unproven concept, or should they stick with their currently lucrative model with the risk that eventually a bunch of upstarts eat their lunch? Credit should go to several of the web giants who have been making efforts to &quot;open up.&quot; Google, Yahoo, eBay, and Amazon all have Open APIs (Application Programming Interfaces) built into their data and systems. Any software developer can access and use them for whatever creative purposes they wish. This means that the API provider becomes an open platform for everyone to use and build on top of. This notion has expanded like wildfire throughout the blogosphere, so nowadays, Open APIs are pretty much required.Other incumbents also have open strategies. AOL has got the RSS religion, providing a feedreader and RSS search in order to escape the &quot;walled garden of content&quot; stigma. Apple now incorporates podcasts, the &quot;personal radio shows&quot; that are latest rage in audio narrowcasting, into iTunes. Even Microsoft is supporting open standards, for example by endorsing SIP (Session Initiation Protocol) for internet telephony and conferencing over Skype&#39;s proprietary format or one of its own devising.But new open standards and protocols are in use, under construction, or being proposed every day, pushing the envelope of where we are right now. Many of these standards are coming from startup companies and small groups of developers, not from the giants. Together with the Open APIs, those new standards will contribute to a new, open infrastructure. Tens of thousands of developers will use and improve this open infrastructure to create new kinds of web-based applications and services, to offer web users a highly personalized online experience.A Brief History of OpennessAt this point, I have to admit that I am not just a passive observer, full-time journalist or &quot;just some blogger&quot;Âbut an active evangelist and developer of these standards. It&#39;s the vision of &quot;open infrastructure&quot; that&#39;s driving my company and the reason why I&#39;m writing this article. This article will give you some of the background behind on these standards, and what the evolution of the next generation of open standards will look like.Starting back in the 1980s, establishing a software standard was a key strategy for any software company. My former company, MacroMind (which became Macromedia), achieved this goal early on with Director. As Director evolved into Flash, the world saw that other companies besides Microsoft, Adobe, and Apple could establish true cross-platform, independent media standards.Then Tim Berners-Lee and Marc Andreessen came along, and changed the rules of the software business and of entrepreneurialism. No matter how entrenched and &quot;standardized&quot; software was, the rug could still get pulled out from under it. Netscape did it to Microsoft, and then Microsoft did it backÂ  to Netscape. The web evolved, and lots of standards evolved with it. The leading open source standards (such as the LAMP stack) became widely used alternatives to proprietary closed-source offerings. Open standards are more than just technology. Open standards mean sharing, empowering, and community support. Someone floats a new idea (or meme) and the community runs with it â with each person making their own contributions to the standard â evolving it without a moment&#39;s hesitation about &quot;giving away their intellectual property.&quot;One good example of this was Dave Sifry, who built the Technorati blog-tracking technology inspired by the Blogging Ecosystem, a weekend project by young hacker Phil Pearson. Dave liked what he saw and he ran with itÂturning Technorati into what it is today.Dave Winer has contributed enormously to this area of open standards. He defined and personally created several open standards and protocolsÂsuch as RSS, OPML, and XML-RPC. Dave has also helped build the blogosphere through his enthusiasm and passion.By 2003, hundreds of programmers were working on creating and establishing new standards for almost everything. The best of these new standards have evolved into compelling web services platforms â such as del.icio.us, Webjay, or Flickr. Some have even spun off formal standards â like XSPF (a standard for playlists) or instant messaging standard XMPP (also known as Jabber).Today&#39;s Open APIs are complemented by standardized SchemasÂthe structure of the data itself and its associated meta-data. Take for example a podcasting feed. It consists of: a) the radio show itself, b) information on who is on the show, what the show is about and how long the show is (the meta-data) and also c) API calls to retrieve a show (a single feed item) and play it from a specified server. The combination of Open APIs, standardized schemas for handling meta-data, and an industry which agrees on these standards are breaking the web wide open right now. So what new open standards should the web incumbentsÂand youÂbe watching? Keep an eye on the following developments:IdentityAttentionOpen MediaMicrocontent PublishingOpen Social NetworksTagsPinging RoutingOpen CommunicationsDevice Management and Control1. IdentityRight now, you don&#39;t really control your own online identity. At the core of just about every online piece of software is a membership system. Some systems allow you to browse a site anonymouslyÂbut unless you register with the site you can&#39;t do things like search for an article, post a comment, buy something, or review it. The problem is that each and every site has its own membership system. So you constantly have to register with new systems, which cannot share dataÂeven you&#39;d want them to. By establishing a &quot;single sign-on&quot; standard, disparate sites can allow users to freely move from site to site, and let them control the movement of their personal profile data, as well as any other data they&#39;ve created. With Passport, Microsoft unsuccessfully attempted to force its proprietary standard on the industry. Instead, a world is evolving where most people assume that users want to control their own data, whether that data is their profile, their blog posts and photos, or some collection of their past interactions, purchases, and recommendations. As long as users can control their digital identity, any kind of service or interaction can be layered on top of it.Identity 2.0 is all about users controlling their own profile data and becoming their own agents. This way the users themselves, rather than other intermediaries, will profit from their ID info. Once developers start offering single sign-on to their users, and users have trusted places to store their dataÂwhich respect the limits and provide access controls over that data, users will be able to access personalized services which will understand and use their personal data.Identity 2.0 may seem like some geeky, visionary future standard that isn&#39;t defined yet, but by putting each user&#39;s digital identity at the core of all their online experiences, Identity 2.0 is becoming the cornerstone of the new open web. The Initiatives:Right now, Identity 2.0 is under construction through various efforts from Microsoft (the &quot;InfoCard&quot; component built into the Vista operating system and its &quot;Identity Metasystem&quot;), Sxip Identity, Identity Commons, Liberty Alliance, LID (NetMesh&#39;s Lightweight ID), and SixApart&#39;s OpenID.More Movers and Shakers:Identity Commons and Kaliya Hamlin, Sxip Identity and Dick Hardt, the Identity Gang and Doc Searls, Microsoft&#39;s Kim Cameron, Craig Burton, Phil Windley, and Brad Fitzpatrick, to name a few.2. AttentionHow many readers know what their online attention is worth? If you don&#39;t, Google and Yahoo doÂthey make their living off our attention. They know what we&#39;re searching for, happily turn it into a keyword, and sell that keyword to advertisers. They make money off our attention. We don&#39;t. Technorati and friends proposed an attention standard, Attention.xml, designed to &quot;help you keep track of what you&#39;ve read, what you&#39;re spending time on, and what you should be paying attention to.&quot; AttentionTrust is an effort by Steve Gillmor and Seth Goldstein to standardize on how captured end-user performance, browsing, and interest data are used. Blogger Peter Caputa gives a good summary of AttentionTrust: &quot;As we use the web, we reveal lots of information about ourselves by what we pay attention to. Imagine if all of that information could be stored in a nice neat little xml file. And when we travel around the web, we can optionally share it with websites or other people. We can make them pay for it, lease it ... we get to decide who has access to it, how long they have access to it, and what we want in return. And they have to tell us what they are going to do with our Attention data.&quot;So when you give your attention to sites that adhere to the AttentionTrust, your attention rights (you own your attention, you can move your attention, you can pay attention and be paid for it,Â  and you can see how your attention is used) are guaranteed. Attention data is crucial to the future of the open web, and Steve and Seth are making sure that no one entity or oligopoly controls it. Movers and Shakers:Steve Gillmor, Seth Goldstein, Dave Sifry and the other Attention.xml folks. 3. Open MediaProprietary media standardsÂFlash, Windows Media, and QuickTime, to name a few Âhelped liven up the web. But they are proprietary standards that try to keep us locked in, and they weren&#39;t created from scratch to handle today&#39;s online content. That&#39;s why, for many of us, an Open Media standard has been a holy grail. Yahoo&#39;s new Media RSS standard brings us one step closer to achieving open media, as do Ogg Vorbis audio codecs, XSPF playlists, or MusicBrainz. And several sites offer digital creators not only a place to store their content, but also to sell it. Media RSS (being developed by Yahoo with help from the community) extends RSS and combines it with &quot;RSS enclosures&quot; Âadds metadata to any media itemÂto create a comprehensive solution for media &quot;narrowcasters.&quot; To gain acceptance for Media RSS, Yahoo knows it has to work with the community. As an active member of this community, I can tell you that we&#39;ll create Media RSS equivalents for rdf (an alternative subscription format) and Atom (yet anotherÂ  subscription format), so no one will be able to complain that Yahoo is picking sides in format wars.When Yahoo announced the purchase of Flickr, Yahoo founder Jerry Yang insinuated that Yahoo is acquiring &quot;open DNA&quot; to turn Yahoo into an open standards player. Yahoo is showing what happens when you take a multi-billion dollar company and make openness one of its core valuesÂso Google, beware, even if Google does have more research fellows and Ph.D.s. The open media landscape is far and wide, reaching from game machine hacks and mobile phone downloads to PC-driven bookmarklets, players, and editors, and it includes many other standardization efforts. XSPF is an open standard for playlists, and MusicBrainz is an alternative to the proprietary (and originally effectively stolen) database that Gracenote licenses. Ourmedia.org is a community front-end to Brewster Kahle&#39;s Internet Archive. Brewster has promised free bandwidth and free storage forever to any content creators who choose to share their content via the Internet Archive. Ourmedia.org is providing an easy-to-use interface and community to get content in and out of the Internet Archive, giving ourmedia.org users the ability to share their media anywhere they wish, without being locked into a particular service or tool. Ourmedia plans to offer open APIs and an open media registry that interconnects other open media repositories into a DNS-like registry (just like the www domain system), so folks can browse and discover open content across many open media services. Systems like Brightcove and Odeo support the concept of an open registry, and hope to work with digital creators to sell their work to fulfill the financial aspect of the &quot;Long Tail.&quot;More Movers and Shakers:Creative Commons, the Open Media Network, Jay Dedman, Ryanne Hodson, Michael Verdi, Eli Chapman, Kenyatta Cheese, Doug Kaye, Brad Horowitz, Lucas Gonze, Robert Kaye, Christopher Allen, Brewster Kahle, JD Lasica, and indeed, Marc Canter, among others.4. Microcontent PublishingUnstructured content is cheap to create, but hard to search through. Structured content is expensive to create, but easy to search. Microformats resolve the dilemma with simple structures that are cheap to use and easy to search.The first kind of widely adopted microcontent is blogging. Every post is an encapsulated idea, addressable via a URL called a permalink. You can syndicate or subscribe to this microcontent using RSS or an RSS equivalent, and news or blog aggregators can then display these feeds in a convenient readable fashion. But a blog post is just a block of unstructured textânot a bad thing, but just a first step for microcontent. When it comes tostructuredÂ data, such as personal identity profiles, product reviews, or calendar-type event data, RSS was not designed to maintain the integrity of the structures. Right now, blogging doesn&#39;t have the underlying structure necessary for full-fledged microcontent publishing. But that will change. Think of local information services (such as movie listings, event guides, or restaurant reviews) that any college kid can access and use in her weekend programming project to create new services and tools.Today&#39;s blogging tools will evolve into microcontent publishing systems, and will help spread the notion of structured data across the blogosphere. New ways to store, represent and produce microcontent will create new standards, such as Structured Blogging and Microformats. Microformats differ from RSS feeds in that you can&#39;t subscribe to them. Instead, Microformats are embedded into webpages and discovered by search engines like Google or Technorati. Microformats are creating common definitions for &quot;What is a review or event? What are the specific fields in the data structure?&quot; They can also specify what we can do with all this information.OPML (Outline Processor Markup Language) is a hierarchical file format for storing microcontent and structured data. It was developed by Dave Winer of RSS and podcast fame.Events are one popular type of microcontent. OpenEvents is already working to create shared databases of standardized events, which would get used by a new generation of event portalsâsuch as Eventful/EVDB, Upcoming.org, and WhizSpark. The idea of OpenEvents is that event-oriented systems and services can work together to establish shared events databases (and associated APIs) that any developer could then use to create and offer their own new service or application. OpenReviews is still in the conceptual stage, but it would make it possible to provide open alternatives to closed systems like Epinions, and establish a shared database of local and global reviews. Its shared open servers would be filled with all sorts of reviews for anyone to access. Why is this important? Because I predict that in the future, 10 times more people will be writing reviews than maintaining their own blog. The list of possible microcontent standards goes on: OpenJobpostings, OpenRecipes, and even OpenLists. Microsoft recently revealed that it has been working on an important new kind of microcontent: Listsâso OpenLists will attempt to establish standards for the kindÂ of lists we all use, such as lists of Links, lists of To Do Items, lists of People, Wish Lists, etc.Movers and Shakers:Tantek Ãelik and Kevin Marks of Technorati, Danny Ayers, Eric Meyer, Matt Mullenweg, Rohit Khare, Adam Rifkin, Arnaud Leene, Seb Paquet, Alf Eaton, Phil Pearson, Joe Reger, Bob Wyman among others.5. Open Social NetworksI&#39;ll never forget the first time I met Jonathan Abrams, the founder of Friendster. He was arrogant and brash and he claimed he &quot;owned&quot;Â  all his users, and that he was going to monetize them and make a fortune off them. This attitude robbed Friendster of its momentum, letting MySpace, Facebook, and other social networks take Friendster&#39;s place.Jonathan&#39;s notion of social networks as a way to control users is typical of the Web 1.0 business model and its attitude towards users in general. Social networks have become one of the battlegrounds between old and new ways of thinking. Open standards for Social Networking will define those sides very clearly. Since meeting Jonathan, I have been working towards finding and establishing open standards for social networks. Instead of closed, centralized social networks with 10 million people in them, the goal is making it possible to have 10 million social networks that each have 10 people in them.FOAF (which stands for Friend Of A Friend, and describes people and relationships in a way that computers can parse) is a schema to represent not only your personal profile&#39;s meta-data, but your social network as well. Thousands of researchers use the FOAF schema in their &quot;Semantic Web&quot; projects to connect people in all sorts of new ways. XFN is a microformat standard for representing your social network, while vCard (long familiar to users of contact manager programs like Outlook) is a microformat that contains your profile information. Microformats are baked into any xHTML webpage, which means thatanyÂ blog, social network page, or any webpage in general can &quot;contain&quot; your social network in itÂand be used byanyÂ compatible tool, service or application. PeopleAggregator is an earlier project now being integrated into open content management framework Drupal. The PeopleAggregator APIs will make it possible to establish relationships, send messages, create or join groups, and post between different social networks. (Sneak preview: this technology will be available in the upcoming GoingOn Network.) All of these open social networking standards mean that inter-connected social networks will form a mesh that will parallel the blogosphere. This vibrant, distributed, decentralized world will be driven by open standards: personalized online experiences are what the new open web will be all aboutÂand what could be more personalized than people&#39;s networks?Movers and Shakers:Eric Sigler, Joel De Gan, Chris Schmidt, Julian Bond, Paul Martino, Mary Hodder, Drummond Reed, Dan Brickley, Randy Farmer, and Kaliya Hamlin, to name a few.6. TagsNowadays, no self-respecting tool or service can ship without tags. Tags are keywords or phrases attached to photos, blog posts, URLs, or even video clips. These user- and creator-generated tags are an open alternative to what used to be the domain of librarians and information scientists: categorizing information and content using taxonomies. Tags are instead creating &quot;folksonomies.&quot;The recently proposed OpenTags concept would be an open, community-owned version of the popular Technorati Tags service. It would aggregate the usage of tags across a wide range of services, sites, and content tools. In addition to Technorati&#39;s current tag features, OpenTags would let groups of people share their tags in &quot;TagClouds.&quot; Open tagging is likely to include some of the open identity features discussed above, to create a tag system that is resilient to spam, and yet trustable across sites all over the web.OpenTags owes a debt to earlier versions of shared tagging systems, which include Topic Exchange and something called the k-collectorÂa knowledge management tag aggregatorÂfrom Italian company eVectors. Movers &amp; Shakers:Phil Pearson, Matt Mower , Paolo Valdemarin, and Mary Hodder and Drummond Reed again, among others.7. PingingWebsites used to be mostly static. Search engines that crawled (or &quot;spidered&quot;) them every so often did a good enough job to show reasonably current versions of your cousin&#39;s homepage or even TimeÂ magazine&#39;s weekly headlines. But when blogging took off, it became hard for search engines to keep up. (Google has only just managed to offer blog-search functionality, despite buying Blogger back in early 2003.)To know what was new in the blogosphere, users couldn&#39;t depend on services that spidered webpages once in a while. The solution: a way for blogs themselves to automatically notify blog-tracking sites that they&#39;d been updated. Weblogs.com was the first blog &quot;ping service&quot;: it displayed the name of a blog whenever that blog was updated. Pinging sites helped the blogosphere grow, and more tools, services, and portals started using pinging in new and different ways. Dozens of pinging services and sitesÂmost of which can&#39;t talk to each otherÂsprang up. Matt Mullenweg (the creator of open source blogging software WordPress) decided that a one-stop service for pinging was needed. He created Ping-o-MaticÂwhich aggregates ping services and simplifies the pinging process for bloggers and tool developers. With Ping-o-Matic, any developer can alert all of the industry&#39;s blogging tools and tracking sites at once. This new kind of open standard, with shared infrastructure, is a critical to the scalability of Web 2.0 services.As Matt said:There are a number of services designed specifically for tracking and connecting blogs. However it would be expensive for all the services to crawl all the blogs in the world all the time. By sending a small ping to each service you let them know you&#39;ve updated so they can come check you out. They get the freshest data possible, you don&#39;t get a thousand robots spidering your site all the time. Everybody wins.Movers and Shakers:Matt Mullenweg, Jim Winstead, Dave Winer8. RoutingBloggers used to have to manually enter the links and content snippets of blog posts or news items they wanted to blog. Today, some RSS aggregators can send a specified post directly into an associated blogging tool: as bloggers browse through the feeds they subscribe to, they can easily specify and send any post they wish to &quot;reblog&quot; from their news aggregator or feed reader into their blogging tool. (This is usually referred to as &quot;BlogThis.&quot;) As structured blogging comes into its own (see the section on Microcontent Publishing), it will be increasingly important to maintain the structural integrity of these pieces of microcontent when reblogging them. Promising standard RedirectThis will combine a &quot;BlogThis&quot;-like capability while maintaining the integrity of the microcontent. RedirectThis will let bloggers and content developers attach a simple &quot;PostThis&quot; button to their posts. Clicking on that button will send that post to the reader/blogger&#39;s favorite blogging tool. This favorite tool is specified at the RedirectThis web service, where users register their blogging tool of choice. RedirectThis also helps maintain the integrity and structure of microcontentÂthen it&#39;s just up to the user to prefer a blogging tool that also attains that lofty goal of microcontent integrity. OutputThis is another nascent web services standard, to let bloggers specify what &quot;destinations&quot; they&#39;d like to have as options in their blogging tool. As new destinations are added to the service, more checkboxes would get added to their blogging toolÂallowing them to route their published microcontent to additional destinations.Movers and Shakers:Michael Migurski, Lucas Gonze9. Open CommunicationsLikely, you&#39;ve experienced the joys of finding friends on AIM or Yahoo Messenger, or the convenience of Skyping with someone overseas. Not that you&#39;re about to throw away your mobile phone or BlackBerry, but for many, also having access to Instant Messaging (IM) and Voice over IP (VoIP) is crucial. IM and VoIP are mainstream technologies that already enjoy the benefits of open standards. Entire industries are bornÂright this secondÂbased around these open standards. Jabber has been an open IM technology for yearsÂin fact, as XMPP, it was officially dubbed a standard by the IETF. Although becoming an official IETF standard is usually the kiss of death, Jabber looks like it&#39;ll be around for a while, as entire generations of collaborative, work-group applications and services have been built on top of its messaging protocol. For VoIP, Skype is clearly the leading standard todayÂthough one could argue just how &quot;open&quot; it is (and defenders of the IETF&#39;s SIP standard often do). But it is free and user-friendly, so there won&#39;t be much argument from usersÂ  about it being insufficiently open. Yet there may be a cloud on Skype&#39;s horizon: web behemoth Google recently released a beta of Google Talk, an IM client committed to open standards. It currently supports XMPP, and will support SIP for VoIP calls.Movers and Shakers:Jeremie Miller, Henning Schulzrinne, Jon Peterson, Jeff Pulver10. Device Management and ControlTo access online content, we&#39;re using more and more devices. BlackBerrys, iPods, Treos, you name it. As the web evolves, more and more different devices will have to communicate with each other to give us the content we want when and where we want it. No-one wants to be dependent on one vendor anymoreÂlike, say, SonyÂfor their laptop, phone, MP3 player, PDA, and digital camera, so that it all works together. We need fully interoperable devices, and the standards to make that work. And to fully make use of how content is moving online content and innovative web services, those standards need to be open.MIDI (musical instrument digital interface), one of the very first open standards in music, connected disparate vendors&#39; instruments, post-production equipment, and recording devices. But MIDI is limited, and MIDI II has been very slow to arrive. Now a new standard for controlling musical devices has emerged: OSC (Open SoundControl). This protocol is optimized for modern networking technology and inter-connects music, video and controller devices with &quot;other multimedia devices.&quot; OSC is used by a wide range of developers, and is being taken up in the mainstream MIDI marketplace.Another open-standards-based device management technology is ZigBee, for building wireless intelligence and network monitoring into all kinds of devices. ZigBee is supported by many networking, consumer electronics, and mobile device companies.Â  Â  Â  Â· Â· Â· Â· Â· Â· Â  Â  The Change to OpennessThe rise of open source software and its &quot;architecture of participation&quot; are completely shaking up the old proprietary-web-services-and-standards approach. Sun MicrosystemsÂwhose proprietary Java standard helped define the Web 1.0Âis opening its Solaris OS and has even announced the apparent paradox of an open-source Digital Rights Management system.Today&#39;s incumbents will have to adapt to the new openness of the Web 2.0. If they stick to their proprietary standards, code, and content, they&#39;ll become the new walled gardensÂplaces users visit briefly to retrieve data and content from enclosed data silos, but not where users &quot;live.&quot; The incumbents&#39; revenue models will have to change. Instead of &quot;owning&quot; their users, users will know they own themselves, and will expect a return on their valuable identity and attention. Instead of being locked into incompatible media formats, users will expect easy access to digital content across many platforms. Yesterday&#39;s web giants and tomorrow&#39;s users will need to find a mutually beneficial new balanceÂbetween open and proprietary, developer and user, hierarchical and horizontal, owned and shared, and compatible and closed. Marc Canter is an active evangelist and developer of open standards. Early in his career, Marc founded MacroMind, which became Macromedia. These days, he is CEO of Broadband Mechanics, a founding member of the Identity Gang and of ourmedia.org. Broadband Mechanics is currently developing the GoingOn Network (with the AlwaysOn Network), as well as an open platform for social networking called the PeopleAggregator.A version of the above post appears in the Fall 2005 issue of AlwaysOn&#39;s quarterly print blogozine, and ran as a four-part series on the AlwaysOn Network website.(Via Marc&#39;s Voice.)</dc:description>
  <content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<p><a href="http://marc.blogs.it/">Marc Canter</a>&#39;s <a href="http://marc.blogs.it/archives/2005/10/breaking_the_we.html">Breaking the Web Wide Open! </a> article is something I found pretty late (by my normal discovery standards). This was partly due to the pre- and post- Web 2.0 event noise levels that have dumped the description of an important industry inflection into the &quot;Bozo Bin&quot; of many. Personally, I think we shouldn&#39;t confuse the Web 2.0 traditional-pitch-fest conference with an attempt to identify an important industry inflection).</p><p> Anyway, Marc&#39;s article is a very refreshing read because it provides a really good insight into the general landscape of a rapidly evolving Web alongside genuine appreciation of our broader timeless pursuit of &quot;Openness&quot;. </p><p>To really help this document provide additional value have scrapped the content of the original post and dumped it below so that we can appreciate the value of the links embedded within the article (note: thanks to Virtuoso I only had to paste the content into my blog, the extraction to my <a href="http://www.openlinksw.com/blog/~kidehen/index.vspx?page=linkblog">Linkblog</a> and <a href="http://www.openlinksw.com/blog/~kidehen/index.vspx?page=summary">Blog Summary</a> Pages are simply features of my <a href="http://www.openlinksw.com/virtuos">Virtuoso </a>based Blog Engine):</p><blockquote><h3 class="hed2" style="padding-bottom: 10px">Breaking the Web Wide Open! (complete story)</h3><p>Even the web giants like AOL, Google, MSN, and Yahoo need to observe these open standards, or they&#39;ll risk becoming the &quot;walled gardens&quot; of the new web and be coolio no more.</p><p class="byline"><b><a href="http://community.alwayson-network.com/cgi-bin/WebObjects/AlwaysOn.woa/wa/display?id=9254:Person">Marc Canter</a></b> [<a href="http://community.alwayson-network.com/cgi-bin/WebObjects/AlwaysOn.woa/wa/display?id=9254:Person"><b>Broadband Mechanics, Inc.</b></a>] | POSTED: 09.26.05 @12:00</p><table width="100%" border="0" cellspacing="0" cellpadding="0"><tr><td valign="TOP" class="copy1"><img src="http://community.alwayson-network.com/ao/images/thumb/19433429363e7cd6b1ecfb7.jpg" align="LEFT" border="0" width="80" style="margin: 0px 10px 5px 0px" alt="" /><i><b>Editorial Note:</b> Several months ago, AlwaysOn got a personal invitation from Yahoo founder Jerry Yang &quot;to see and give us feedback on our new social media product, y!360.&quot; We were happy to oblige and dutifully showed up, joining a conference room full of hard-core bloggers and new, new media types. The geeks gave Yahoo 360 an overwhelming thumbs down, with comments like, &quot;So the only services I can use within this new network are Yahoo services? What if I don&#39;t use Yahoo IM?&quot; In essence, the Yahoo team was booed for being &quot;closed web,&quot; and we heartily agreed. With Yahoo 360, Yahoo continues building its own &quot;walled garden&quot; to control its 135 million customersÂan accusation also hurled at AOL in the early 1990s, before AOL migrated its private network service onto the web. As the</i>Â  <a href="http://bernardmoon.blogspot.com/2005/08/yahoos-personality-crisis.html" target="_blank">Economist<i> recently noted</i></a>, &quot;Yahoo, in short, has old media plans for the new-media era.&quot;<br /><br />The irony to our view here is, of course, that today&#39;s AO Network is also a &quot;closed web.&quot; In the end, Mr. Yang&#39;s thoughtful invitation and our ensuing disappointment in his new service led to the assignment of this article. It also confirmed our existing plan to completely revamp the AO Network around open standards. To tie it all together, we recruited the chief architect of our new site, <a href="http://www.corante.com/amateur/articles/20030211-3564.html" target="_blank">the notorious Marc Canter</a>, to pen this piece. We look forward to our reader feedback.<br /><br /><b>Breaking the Web Wide Open!</b><br />By Marc Canter<br /><br />For decades, &quot;walled gardens&quot; of proprietary standards and content have been the strategy of dominant players in mainframe computer software, wireless telecommunications services, and the World Wide WebÂit was their successful lock-in strategy of keeping their customers theirs. But like it or not, those walls are tumbling down. Open web standards are being adopted so widely, with such value and impact, that the web giantsÂAmazon, AOL, eBay, Google, Microsoft, and YahooÂare facing the difficult decision of opening up to what they don&#39;t control.<br /><br />The online world is evolving into a new open web (sometimes called the Web 2.0), which is all about being personalized and customized for each user. Not only open source software, but <i>open standards</i>Â are becoming an essential component. <br /><br />Many of the web giants have been using open source software for years. Most of them use at least parts of the <a href="http://www.onlamp.com/pub/a/onlamp/2001/01/25/lamp.html" target="_blank">LAMP</a> (Linux, Apache, MySQL, Perl/Python/PHP) stack, even if they aren&#39;t well-known for giving back to the open source community. For these incumbents that grew big on proprietary web services, the methods, practices, and applications of open source software development are difficult to fully adopt. And the next open source movementsÂwhich will be as much about open standards as about codeÂwill be a lot harder for the incumbents to exploit.<br /><br />While the incumbents use cheap open source software to run their back-ends systems, their business models largely depend on proprietary software and algorithms. But our view a new slew of open software, open protocols, and open standards will confront the incumbents with the classic <i><a href="http://www.businessweek.com/chapter/christensen.htm" target="_blank">Innovator&#39;s Dilemma</a></i>.Â  Should they adopt these tools and standards, painfully cannibalizing their existing revenue for a new unproven concept, or should they stick with their currently lucrative model with the risk that eventually a bunch of upstarts eat their lunch? <br /><br />Credit should go to several of the web giants who have been making efforts to &quot;open up.&quot; Google, Yahoo, eBay, and Amazon all have Open APIs (Application Programming Interfaces) built into their data and systems. Any software developer can access and use them for whatever creative purposes they wish. This means that the API provider becomes an open platform for everyone to use and build on top of. This notion has expanded like wildfire throughout the blogosphere, so nowadays, Open APIs are pretty much required.<br /><br />Other incumbents also have open strategies. AOL has got the RSS religion, <a href="http://www.siliconbeat.com/entries/2005/07/27/aol_gets_rss_religion_with_my_aoland_feedsters_help.html" target="_blank">providing a feedreader and RSS search</a> in order to escape the &quot;walled garden of content&quot; stigma. <a href="http://www.apple.com/podcasting/" target="_blank">Apple now incorporates podcasts</a>, the &quot;personal radio shows&quot; that are latest rage in audio narrowcasting, into iTunes. Even Microsoft is supporting open standards, for example <a href="http://www.microsoft.com/technet/prodtechnol/winxppro/plan/rtcprot.mspx#EKAA" target="_blank">by endorsing SIP (Session Initiation Protocol) for internet telephony and conferencing</a> over Skype&#39;s proprietary format or one of its own devising.<br /><br />But new open standards and protocols are in use, under construction, or being proposed every day, pushing the envelope of where we are right now. Many of these standards are coming from startup companies and small groups of developers, not from the giants. Together with the Open APIs, those new standards will contribute to a new, open infrastructure. Tens of thousands of developers will use and improve this open infrastructure to create new kinds of web-based applications and services, to offer web users a highly personalized online experience.<br /><br /><b>A Brief History of Openness</b><br /><br />At this point, I have to admit that I am not just a passive observer, full-time journalist or &quot;just some blogger&quot;Âbut an active evangelist and developer of these standards. It&#39;s the vision of &quot;open infrastructure&quot; that&#39;s driving <a href="http://www.broadbandmechanics.com/bbm2005.htm" target="_blank">my company </a> and the reason why I&#39;m writing this article. This article will give you some of the background behind on these standards, and what the evolution of the next generation of open standards will look like.<br /><br />Starting back in the 1980s, establishing a software standard was a key strategy for any software company. My former company, MacroMind (which became Macromedia), achieved this goal early on with Director. As <a href="http://webmonkey.wired.com/webmonkey/99/27/index3a_page6.html?tw=multimedia" target="_blank">Director evolved into Flash</a>, the world saw that other companies besides Microsoft, Adobe, and Apple could establish true cross-platform, independent media standards.<br /><br />Then <a href="http://www.w3.org/People/Berners-Lee/" target="_blank">Tim Berners-Lee</a> and <a href="http://www.ibiblio.org/pioneers/andreesen.html" target="_blank">Marc Andreessen</a> came along, and changed the rules of the software business and of entrepreneurialism. No matter how entrenched and &quot;standardized&quot; software was, the rug could still get pulled out from under it. <a href="http://geekphilosopher.com/MainPage/WebBrowserWars.htm?q=Stocks" target="_blank">Netscape did it to Microsoft, and then Microsoft did it <i>back</i>Â  to Netscape</a>. The web evolved, and lots of standards evolved with it. The leading open source standards (such as the LAMP stack) became widely used alternatives to proprietary closed-source offerings. <br /><br />Open standards are more than just technology. Open standards mean sharing, empowering, and community support. Someone floats a new idea (or <a href="http://en.wikipedia.org/wiki/Meme" target="_blank">meme</a>) and the community runs with it â with each person making their own contributions to the standard â evolving it without a moment&#39;s hesitation about &quot;giving away their intellectual property.&quot;<br /><br />One good example of this was <a href="http://www.sifry.com/alerts/" target="_blank">Dave Sifry</a>, who built the Technorati blog-tracking technology inspired by the <a href="http://www.myelin.co.nz/ecosystem/" target="_blank">Blogging Ecosystem</a>, a weekend project by young hacker <a href="http://marc.blogs.it/archives/2005/07/phil_pearson_jo.html" target="_blank">Phil Pearson</a>. Dave liked what he saw and he ran with itÂturning Technorati into what it is today.<br /><br /><a href="http://en.wikipedia.org/wiki/Dave_Winer" target="_blank">Dave Winer</a> has contributed enormously to this area of open standards. He defined and personally created several open standards and protocolsÂsuch as RSS, OPML, and XML-RPC. Dave has also <a href="http://newhome.weblogs.com/historyOfWeblogs" target="_blank">helped build</a> the blogosphere through his enthusiasm and passion.<br /><br />By 2003, hundreds of programmers were working on creating and establishing new standards for almost everything. The best of these new standards have evolved into compelling web services platforms â such as <a href="http://del.icio.us/" target="_blank">del.icio.us</a>, <a href="http://webjay.org/about" target="_blank">Webjay</a>, or <a href="http://www.flickr.com/photos/tags/ao2005/" target="_blank">Flickr</a>. Some have even spun off formal standards â like XSPF (a standard for playlists) or instant messaging standard XMPP (also known as Jabber).<br /><br />Today&#39;s Open APIs are complemented by standardized SchemasÂthe structure of the data itself and its associated meta-data. Take for example a <a href="http://www.ipodder.org/whatIsPodcasting" target="_blank">podcasting feed</a>. It consists of: a) the radio show itself, b) information on who is on the show, what the show is about and how long the show is (the meta-data) and also c) API calls to retrieve a show (a single feed item) and play it from a specified server. <br /><br />The combination of Open APIs, standardized schemas for handling meta-data, and an industry which agrees on these standards are breaking the web wide open right now. So what new open standards should the web incumbentsÂand youÂbe watching? Keep an eye on the following developments:<br /><br /><b>Identity<br />Attention<br />Open Media<br />Microcontent Publishing<br />Open Social Networks<br />Tags<br />Pinging <br />Routing<br />Open Communications<br />Device Management and Control</b><br /><br /><br /><b>1.	Identity</b><br /><br />Right now, you don&#39;t really control your own online identity. At the core of just about every online piece of software is a membership system. Some systems allow you to browse a site anonymouslyÂbut unless you register with the site you can&#39;t do things like search for an article, post a comment, buy something, or review it. The problem is that each and every site has its own membership system. So you constantly have to register with new systems, which cannot share dataÂeven you&#39;d want them to. By establishing a <a href="http://www.wired.com/news/privacy/0,1848,68329-2,00.html?tw=wn_story_page_next1" target="_blank">&quot;single sign-on&quot; standard</a>, disparate sites can allow users to freely move from site to site, and let them control the movement of their personal profile data, as well as any other data they&#39;ve created. <br /><br />With <a href="http://www.thehindubusinessline.com/2005/01/03/stories/2005010301440200.htm" target="_blank">Passport, Microsoft unsuccessfully attempted</a> to force its proprietary standard on the industry. Instead, a world is evolving where most people assume that users want to control their own data, whether that data is their profile, their blog posts and photos, or some collection of their past interactions, purchases, and recommendations. As long as users can control their digital identity, any kind of service or interaction can be layered on top of it.<br /><br /><a href="http://www.identity20.com/media/OSCON2005/" target="_blank">Identity 2.0</a> is all about users controlling their own profile data and becoming their own agents. This way the users themselves, rather than other intermediaries, will profit from their ID info. Once developers start offering single sign-on to their users, and users have trusted places to store their dataÂwhich respect the limits and provide access controls over that data, users will be able to access personalized services which will understand and use their personal data.<br /><br />Identity 2.0 may seem like some geeky, visionary future standard that isn&#39;t defined yet, but by putting each user&#39;s digital identity at the core of all their online experiences, Identity 2.0 is becoming the cornerstone of the new open web. <br /><br /><b>The Initiatives:</b><br />Right now, Identity 2.0 is under construction through various efforts from Microsoft (the <a href="http://msdn.microsoft.com/webservices/webservices/understanding/advancedwebservices/default.aspx?pull=/library/en-us/dnwebsrv/html/identitymetasystem.asp" target="_blank">&quot;InfoCard&quot; component built into the Vista operating system</a> and its &quot;<a href="http://garage.docsearls.com/node/605" target="_blank">Identity Metasystem</a>&quot;), <a href="http://sxip.com" target="_blank">Sxip Identity</a>, <a href="http://www.identtycommons.net" target="_blank">Identity Commons</a>, <a href="http://www.projectliberty.org/" target="_blank">Liberty Alliance</a>, <a href="http://lid.netmesh.org/" target="_blank">LID</a> (NetMesh&#39;s Lightweight ID), and SixApart&#39;s <a href="http://openid.net/" target="_blank">OpenID</a>.<br /><br /><b>More Movers and Shakers:</b><br />Identity Commons and <a href="http://www.identitywoman.net" target="_blank">Kaliya Hamlin</a>, Sxip Identity and <a href="http://blame.ca/dick/" target="_blank">Dick Hardt</a>, the <a href="http://www.identitygang.org/" target="_blank"> Identity Gang</a> and <a href="http://www.searls.com/dochome.html#Bio" target="_blank">Doc Searls</a>, Microsoft&#39;s <a href="http://www.identityblog.com/" target="_blank">Kim Cameron</a>, <a href="http://www.craigburton.com/" target="_blank">Craig Burton</a>, <a href="http://phil.windley.org/" target="_blank">Phil Windley</a>, and <a href="http://slashdot.org/article.pl?sid=05/07/05/2020221&from=rss" target="_blank">Brad Fitzpatrick</a>, to name a few.<br /><br /><br /><b>2.	Attention</b><br /><br />How many readers know what their online attention is worth? If you don&#39;t, Google and Yahoo doÂthey make their living off our attention. They know what we&#39;re searching for, happily turn it into a keyword, and sell that keyword to advertisers. They make money off our attention. We don&#39;t. <br /><br />Technorati and friends proposed <a href="http://blogs.zdnet.com/Gillmor/index.php?p=74" target="_blank">an attention standard, Attention.xml</a>, designed to &quot;help you keep track of what you&#39;ve read, what you&#39;re spending time on, and what you should be paying attention to.&quot; <a href="http://attentiontrust.org/" target="_blank">AttentionTrust</a> is an effort by <a href="http://blogs.zdnet.com/Gillmor/?p=132" target="_blank">Steve Gillmor</a> and <a href="http://majestic.typepad.com/seth/2005/07/attentiontrusto.html" target="_blank">Seth Goldstein </a>to standardize on how captured end-user performance, browsing, and interest data are used. <br /><br />Blogger <a href="http://worcester.typepad.com/pc4media/2005/07/attentiontrusto_1.html" target="_blank">Peter Caputa gives a good summary</a> of AttentionTrust: <blockquote>&quot;As we use the web, we reveal lots of information about ourselves by what we pay attention to. Imagine if all of that information could be stored in a nice neat little xml file. And when we travel around the web, we can optionally share it with websites or other people. We can make them pay for it, lease it ... we get to decide who has access to it, how long they have access to it, and what we want in return. And they have to tell us what they are going to do with our Attention data.&quot;</blockquote><br />So when you give your attention to sites that adhere to the AttentionTrust, your attention rights (<i>you own your attention, you can move your attention, you can pay attention and be paid for it</i>,Â  and <i>you can see how your attention is used</i>) are guaranteed. Attention data is crucial to the future of the open web, and Steve and Seth are making sure that no one entity or oligopoly controls it. <br /><br /><b>Movers and Shakers:</b><br /><a href="http://blogs.zdnet.com/Gillmor/" target="_blank">Steve Gillmor</a>, <a href="http://majestic.typepad.com/about.html" target="_blank">Seth Goldstein</a>, <a href="http://www.sifry.com/alerts/" target="_blank">Dave Sifry</a> and the <a href="http://developers.technorati.com/wiki/attentionxml" target="_blank">other Attention.xml folks</a>. <br /><br /><br /><b>3.	Open Media</b><br /><br />Proprietary media standardsÂFlash, Windows Media, and QuickTime, to name a few Âhelped liven up the web. But they are proprietary standards that try to keep us locked in, and they weren&#39;t created from scratch to handle today&#39;s online content. That&#39;s why, for many of us, an Open Media standard has been a holy grail. Yahoo&#39;s new Media RSS standard brings us one step closer to achieving open media, as do <a href="http://www.vorbis.com/faq/#what" target="_blank">Ogg Vorbis</a> audio codecs, <a href="http://webjay.org/" target="_blank">XSPF playlists</a>, or <a href="http://musicbrainz.org/" target="_blank">MusicBrainz</a>. And several sites offer digital creators not only a place to store their content, but also to sell it. <br /><br /><a href="http://search.yahoo.com/mrss" target="_blank">Media RSS </a>(being developed by Yahoo with help from the community) extends RSS and combines it with &quot;RSS enclosures&quot; Âadds metadata to any media itemÂto create a comprehensive solution for media &quot;narrowcasters.&quot; To gain acceptance for Media RSS, Yahoo knows it has to work with the community. As an active member of this community, I can tell you that we&#39;ll create Media RSS equivalents for <a href="http://www.xml.com/pub/a/2001/01/24/rdf.html" target="_blank">rdf</a> (an alternative subscription format) and <a href="http://www.atomenabled.org/" target="_blank">Atom</a> (yet <i>another</i>Â  subscription format), so no one will be able to complain that Yahoo is picking sides in format wars.<br /><br />When Yahoo announced the purchase of Flickr, Yahoo founder Jerry Yang insinuated that Yahoo is acquiring &quot;open DNA&quot; to turn Yahoo into <a href="http://www.flickr.com/services/api/" target="_blank">an open standards player</a>. Yahoo is showing what happens when you take a multi-billion dollar company and make openness one of its core valuesÂso Google, beware, even if Google does have more research fellows and Ph.D.s. <br /><br />The open media landscape is far and wide, reaching from game machine hacks and mobile phone downloads to PC-driven bookmarklets, players, and editors, and it includes many other standardization efforts. <a href="http://www.xspf.org/" target="_blank">XSPF</a> is an open standard for playlists, and MusicBrainz is an alternative to the proprietary (and originally effectively stolen) database that <a href="http://en.wikipedia.org/wiki/Gracenote" target="_blank">Gracenote</a> licenses. <br /><br /><a href="http://www.ourmedia.org/" target="_blank">Ourmedia.org</a> is a community front-end to Brewster Kahle&#39;s <a href="http://www.archive.org" target="_blank">Internet Archive</a>. Brewster has promised free bandwidth and free storage forever to any content creators who choose to share their content via the Internet Archive. Ourmedia.org is providing an easy-to-use interface and community to get content in and out of the Internet Archive, giving ourmedia.org users the ability to share their media anywhere they wish, without being locked into a particular service or tool. Ourmedia plans to offer open APIs and an open media registry that interconnects other open media repositories into a DNS-like registry (just like the www domain system), so folks can browse and discover open content across many open media services. Systems like <a href="http://www.brightcove.com/" target="_blank">Brightcove</a> and <a href="http://www.evhead.com/2005/02/how-odeo-happened.asp" target="_blank">Odeo</a> support the concept of an open registry, and hope to work with digital creators to sell their work to fulfill the financial aspect of <a href="http://en.wikipedia.org/wiki/The_Long_Tail" target="_blank">the &quot;Long Tail.&quot;</a><br /><br /><b>More Movers and Shakers:</b><br /><a href="http://creativecommons.org/about/people" target="_blank">Creative Commons</a>, the <a href="http://www.omn.org/" target="_blank">Open Media Network</a>, <a href="http://www.momentshowing.net/about.html" target="_blank">Jay Dedman</a>, <a href="http://ryanedit.blogspot.com/" target="_blank">Ryanne Hodson</a>, <a href="http://michaelverdi.com/index.php" target="_blank">Michael Verdi</a>, <a href="http://www.chapmanlogic.com/blog/aboutEli.html" target="_blank">Eli Chapman</a>, <a href="http://www.unmediated.org/" target="_blank">Kenyatta Cheese</a>, <a href="http://www.itconversations.com/about.html" target="_blank">Doug Kaye</a>, <a href="http://www.wired.com/wired/archive/13.09/yahoo.html" target="_blank">Brad Horowitz</a>, <a href="http://webjay.org/about#colophon" target="_blank">Lucas Gonze</a>, <a href="http://musicbrainz.org/wd/MusicBrainzBio" target="_blank">Robert Kaye</a>,  <a href="http://www.lifewithalacrity.com/" target="_blank">Christopher Allen</a>, <a href="http://en.wikipedia.org/wiki/Brewster_Kahle" target="_blank">Brewster Kahle</a>, <a href="http://www.newmediamusings.com/" target="_blank">JD Lasica</a>, and indeed, <a href="http://www.corante.com/amateur/articles/20030211-3564.html" target="_blank">Marc Canter</a>, among others.<br /><br /><br /><b>4.	Microcontent Publishing</b><br /><br />Unstructured content is cheap to create, but hard to search through. Structured content is expensive to create, but easy to search. <a href="http://developers.technorati.com/wiki/MicroFormats" target="_blank">Microformats</a> resolve the dilemma with simple structures that are cheap to use and easy to search.<br /><br />The first kind of widely adopted microcontent is blogging. Every post is an encapsulated idea, addressable via a URL called a permalink. You can syndicate or subscribe to this microcontent using RSS or an RSS equivalent, and news or blog aggregators can then display these feeds in a convenient readable fashion. But a blog post is just a block of unstructured textânot a bad thing, but just a first step for microcontent. When it comes to<i>structured</i>Â data, such as personal identity profiles, product reviews, or calendar-type event data, RSS was not designed to maintain the integrity of the structures. <br /><br />Right now, blogging doesn&#39;t have the underlying structure necessary for full-fledged microcontent publishing. But that will change. Think of local information services (such as movie listings, event guides, or restaurant reviews) that any college kid can access and use in her weekend programming project to create new services and tools.<br /><br />Today&#39;s blogging tools will evolve into microcontent publishing systems, and will help spread the notion of structured data across the blogosphere. New ways to store, represent and produce microcontent will create new standards, such as <a href="http://structuredblogging.org/" target="_blank">Structured Blogging</a> and <a href="http://microformats.org/" target="_blank">Microformats</a>. Microformats differ from RSS feeds in that you can&#39;t subscribe to them. Instead, Microformats are embedded into webpages and discovered by search engines like Google or Technorati. Microformats are creating common definitions for &quot;What is a review or event? What are the specific fields in the data structure?&quot; They can also specify what we can do with all this information.<a href="http://www.opml.org/spec" target="_blank">OPML (Outline Processor Markup Language)</a> is a hierarchical file format for storing microcontent and structured data. It was developed by <a href="http://en.wikipedia.org/wiki/Dave_Winer" target="_blank">Dave Winer</a> of RSS and podcast fame.<br /><br />Events are one popular type of microcontent. <a href="http://www.openevents.com" target="_blank">OpenEvents</a> is already working to create shared databases of standardized events, which would get used by a new generation of event portalsâsuch as <a href="http://eventful.com/gotevents/" target="_blank">Eventful/EVDB</a>, <a href="http://upcoming.org/" target="_blank">Upcoming.org</a>, and <a href="http://www.whizspark.com/" target="_blank">WhizSpark</a>. The idea of OpenEvents is that event-oriented systems and services can work together to establish shared events databases (and associated APIs) that any developer could then use to create and offer their own new service or application. <a href="http://marc.blogs.it/archives/2005/04/rvw_redux_openr.html" target="_blank">OpenReviews</a> is still in the conceptual stage, but it would make it possible to provide open alternatives to closed systems like Epinions, and establish a shared database of local and global reviews. Its shared open servers would be filled with all sorts of reviews for anyone to access. <br /><br />Why is this important? Because I predict that in the future, 10 times more people will be writing reviews than maintaining their own blog. The list of possible microcontent standards goes on: OpenJobpostings, OpenRecipes, and even OpenLists. Microsoft <a href="http://www.reallysimplesyndication.com/2005/06/22" target="_blank">recently revealed</a> that it has been working on an important new kind of microcontent: Listsâso OpenLists will attempt to establish standards for the <i>kind</i>Â of lists we all use, such as lists of Links, lists of To Do Items, lists of People, Wish Lists, etc.<br /><br /><b>Movers and Shakers:</b><br /><a href="http://tantek.com/log/2005/09.html" target="_blank">Tantek Ãelik</a> and <a href="http://en.wikipedia.org/wiki/Kevin_Marks" target="_blank">Kevin Marks</a> of <a href="http://developers.technorati.com/wiki/MicroFormats" target="_blank">Technorati</a>, <a href="http://dannyayers.com/" target="_blank">Danny Ayers</a>, <a href="http://www.meyerweb.com/" target="_blank">Eric Meyer</a>, <a href="http://photomatt.net/" target="_blank">Matt Mullenweg</a>, <a href="http://zlab.commerce.net/" target="_blank">Rohit Khare</a>, <a href="http://ifindkarma.typepad.com/relax/" target="_blank">Adam Rifkin</a>, <a href="http://www.sivas.com/aleene/" target="_blank">Arnaud Leene</a>, <a href="http://radio.weblogs.com/0110772/" target="_blank">Seb Paquet</a>, <a href="http://hublog.hubmed.org/" target="_blank">Alf Eaton</a>, <a href="http://www.myelin.co.nz/post/" target="_blank">Phil Pearson</a>, <a href="http://www.joereger.com/" target="_blank">Joe Reger</a>, <a href="http://bobwyman.pubsub.com/" target="_blank">Bob Wyman</a> among others.<br /><br /><br /><b>5.	Open Social Networks</b><br /><br />I&#39;ll never forget the first time I met <a href="http://www.jabrams.com/" target="_blank">Jonathan Abrams</a>, the founder of Friendster. He was arrogant and brash and he claimed he &quot;<i>owned</i>&quot;Â  all his users, and that he was going to monetize them and make a fortune off them. This attitude robbed Friendster of its momentum, letting MySpace, Facebook, and other social networks take Friendster&#39;s place.<br /><br />Jonathan&#39;s notion of social networks as a way to control users is typical of the Web 1.0 business model and its attitude towards users in general. Social networks have become one of the battlegrounds between old and new ways of thinking. Open standards for Social Networking will define those sides very clearly. Since meeting Jonathan, I have been working towards finding and establishing open standards for social networks. Instead of closed, centralized social networks with 10 million people in them, the goal is making it possible to have 10 million social networks that each have 10 people in them.<br /><br />FOAF (which stands for Friend Of A Friend, and describes people and relationships in a way that computers can parse) is a schema to represent not only your personal profile&#39;s meta-data, but your social network as well. Thousands of researchers use the <a href="http://www.foaf-project.org/" target="_blank">FOAF schema</a> in their &quot;Semantic Web&quot; projects to connect people in all sorts of new ways. <a href="http://gmpg.org/xfn/" target="_blank">XFN</a> is a microformat standard for representing your social network, while <a href="http://www.imc.org/pdi/" target="_blank">vCard</a> (long familiar to users of contact manager programs like Outlook) is a microformat that contains your profile information. Microformats are baked into any xHTML webpage, which means that<i>any</i>Â blog, social network page, or any webpage in general can &quot;contain&quot; your social network in itÂand be used by<i>any</i>Â compatible tool, service or application. <br /><br />PeopleAggregator is an earlier project now being integrated into <a href="http://drupal.org/" target="_blank">open content management framework Drupal</a>. The <a href="http://www.broadbandmechanics.com/PeopleAggregator/" target="_blank">PeopleAggregator APIs</a> will make it possible to establish relationships, send messages, create or join groups, and post between different social networks. (Sneak preview: this technology will be available in the upcoming GoingOn Network.) <br /><br />All of these open social networking standards mean that inter-connected social networks will form a mesh that will parallel the blogosphere. This vibrant, distributed, decentralized world will be driven by open standards: personalized online experiences are what the new open web will be all aboutÂand what could be more personalized than people&#39;s networks?<br /><br /><b>Movers and Shakers:</b><br /><a href="http://esigler.2nw.net/" target="_blank">Eric Sigler</a>, <a href="http://lucifer.intercosmos.net/index.php?view=about" target="_blank">Joel De Gan</a>, <a href="http://crschmidt.net/" target="_blank">Chris Schmidt</a>, <a href="http://voidstar.com/" target="_blank">Julian Bond</a>, <a href="http://people.tribe.net/paul?_click_path=Application%5Btribe%5D.Person%5Bf2232c95-e123-43a3-b48d-24a5f11f09dc%5D&r=10535" target="_blank">Paul Martino</a>, <a href="http://napsterization.org/stories/archives/000513.html" target="_blank">Mary Hodder</a>, <a href="http://public.2idi.com/=Drummond.Reed" target="_blank">Drummond Reed</a>, <a href="http://danbri.org/" target="_blank">Dan Brickley</a>, <a href="http://360.yahoo.com/profile-9lciejI3aafX1stHPoIRNmkmv4EowQ--" target="_blank">Randy Farmer</a>, and <a href="http://www.kaliyasblogs.net/Iwoman/" target="_blank">Kaliya Hamlin</a>, to name a few.<br /><br /><br /><b>6.	Tags</b><br /><br />Nowadays, no self-respecting tool or service can ship without <a href="http://www.salon.com/tech/feature/2005/02/08/tagging/index_np.html" target="_blank">tags</a>. Tags are keywords or phrases attached to photos, blog posts, URLs, or even video clips. These user- and creator-generated tags are an open alternative to what used to be the domain of librarians and information scientists: categorizing information and content using taxonomies. Tags are instead creating <a href="http://www.wired.com/wired/archive/13.04/view.html?pg=4" target="_blank">&quot;folksonomies.&quot;</a><br /><br />The recently proposed OpenTags concept would be an open, community-owned version of the popular <a href="http://www.technorati.com/tag/" target="_blank">Technorati Tags service</a>. It would aggregate the usage of tags across a wide range of services, sites, and content tools. In addition to Technorati&#39;s current tag features, OpenTags would let groups of people share their tags in &quot;<a href="http://www.zeldman.com/daily/0405d.shtml/" target="_blank">TagClouds</a>.&quot; Open tagging is likely to include some of the open identity features discussed above, to create a tag system that is resilient to spam, and yet trustable across sites all over the web.<br /><br />OpenTags owes a debt to earlier versions of shared tagging systems, which include <a href="http://www.topicexchange.com/" target="_blank">Topic Exchange</a> and something called the <a href="http://www.evectors.com/itkcollector/" target="_blank">k-collector</a>Âa knowledge management tag aggregatorÂfrom Italian company eVectors. <br /><br /><b>Movers &amp; Shakers:</b><br /><a href="http://www.myelin.co.nz/notes/" target="_blank">Phil Pearson</a>, <a href="http://matt.blogs.it/" target="_blank">Matt Mower </a>, <a href="http://paolo.evectors.it/" target="_blank">Paolo Valdemarin</a>, and <a href="http://marc.blogs.it/archives/2005/03/opentopics.html" target="_blank">Mary Hodder</a> and <a href="http://www.equalsdrummond.name/index.php?p=39" target="_blank"> Drummond Reed</a> again, among others.<br /><br /><br /><b>7. Pinging</b><br /><br />Websites used to be mostly static. Search engines that <a href="http://en.wikipedia.org/wiki/Web_crawler" target="_blank">crawled</a> (or &quot;spidered&quot;) them every so often did a good enough job to show reasonably current versions of your cousin&#39;s homepage or even <i>Time</i>Â magazine&#39;s weekly headlines. But when blogging took off, it became hard for search engines to keep up. (Google has only <a href="http://searchenginewatch.com/searchday/article.php/3548411" target="_blank">just managed</a> to offer <a href="http://www.google.com/help/about_blogsearch.html" target="_blank">blog-search functionality</a>, despite <a href="http://www.alwayson-network.com/comments.php?id=325_0_2_0_C" target="_blank">buying Blogger</a> back in early 2003.)<br /><br />To know what was new in the blogosphere, users couldn&#39;t depend on services that spidered webpages once in a while. The solution: a way for blogs themselves to automatically notify blog-tracking sites that they&#39;d been updated. <a href="http://weblogs.com/" target="_blank">Weblogs.com</a> was the first blog &quot;ping service&quot;: it displayed the name of a blog whenever that blog was updated. Pinging sites helped the blogosphere grow, and <a href="http://blo.gs/" target="_blank">more tools</a>, services, and portals started using pinging in new and different ways. Dozens of pinging services and sitesÂmost of which can&#39;t talk to each otherÂsprang up. <br /><br />Matt Mullenweg (the creator of open source blogging software WordPress) decided that a one-stop service for pinging was needed. He created <a href="http://pingomatic.com/" target="_blank">Ping-o-Matic</a>Âwhich aggregates ping services and simplifies the pinging process for bloggers and tool developers. With Ping-o-Matic, any developer can alert all of the industry&#39;s blogging tools and tracking sites at once. This new kind of open standard, with shared infrastructure, is a critical to the scalability of Web 2.0 services.<br /><br />As <a href="http://pingomatic.com/about/" target="_blank">Matt said</a>:<br /><blockquote>There are a number of services designed specifically for tracking and connecting blogs. However it would be expensive for all the services to crawl all the blogs in the world all the time. By sending a small ping to each service you let them know you&#39;ve updated so they can come check you out. They get the freshest data possible, you don&#39;t get a thousand robots spidering your site all the time. Everybody wins.</blockquote><br /><b>Movers and Shakers:</b><br /><a href="http://photomatt.net/about/" target="_blank">Matt Mullenweg</a>, <a href="http://trainedmonkey.com/entry/2251" target="_blank">Jim Winstead</a>, <a href="http://newhome.weblogs.com/faq" target="_blank">Dave Winer</a><br /><br /><br /><b>8. Routing</b><br /><br />Bloggers used to have to manually enter the links and content snippets of blog posts or news items they wanted to blog. Today, some RSS aggregators can send a specified post directly into an associated blogging tool: as bloggers browse through the feeds they subscribe to, they can easily specify and send any post they wish to &quot;<a href="http://www.microsoftmonitor.com/archives/010209.html" target="_blank">reblog</a>&quot; from their news aggregator or feed reader into their blogging tool. (This is usually referred to as &quot;<a href="http://help.blogger.com/bin/answer.py?answer=152&topic=17" target="_blank">BlogThis</a>.&quot;) As structured blogging comes into its own (see the section on Microcontent Publishing), it will be increasingly important to maintain the structural integrity of these pieces of microcontent when reblogging them. <br /><br />Promising standard <a href="http://redirectthis.com/" target="_blank">RedirectThis</a> will combine a &quot;BlogThis&quot;-like capability while maintaining the integrity of the microcontent. RedirectThis will let bloggers and content developers attach a simple &quot;PostThis&quot; button to their posts. Clicking on that button will send that post to the reader/blogger&#39;s favorite <a href="http://ecto.kung-foo.tv/archives/000990.php" target="_blank">blogging tool</a>. This favorite tool is specified at the RedirectThis web service, where users register their blogging tool of choice. RedirectThis also helps maintain the integrity and structure of microcontentÂthen it&#39;s just up to the user to prefer a blogging tool that also attains that lofty goal of microcontent integrity. <br /><br />OutputThis is another nascent web services standard, to let bloggers specify what &quot;destinations&quot; they&#39;d like to have as options in their blogging tool. As new destinations are added to the service, more checkboxes would get added to their blogging toolÂallowing them to route their published microcontent to additional destinations.<br /><br /><b>Movers and Shakers:</b><br /><a href="http://reblog.org/" target="_blank">Michael Migurski</a>, <a href="http://www.gonze.com/about" target="_blank">Lucas Gonze</a><br /><br /><br /><b>9. Open Communications</b><br /><br />Likely, you&#39;ve experienced the joys of finding friends on AIM or Yahoo Messenger, or the convenience of Skyping with someone overseas. Not that you&#39;re about to throw away your mobile phone or BlackBerry, but for many, also having access to Instant Messaging (IM) and Voice over IP (VoIP) is crucial. <br /><br />IM and VoIP are mainstream technologies that already enjoy the benefits of open standards. Entire industries are bornÂright this secondÂbased around these open standards. <a href="http://www.jabber.org/" target="_blank">Jabber</a> has been an open IM technology for yearsÂin fact, <a href="http://www.xmpp.org/history.html" target="_blank">as XMPP</a>, it was officially dubbed a standard by <a href="http://www.ietf.org/overview.html" target="_blank">the IETF</a>. Although becoming an <a href="http://en.wikipedia.org/wiki/IETF" target="_blank">official IETF standard</a> is usually the kiss of death, Jabber looks like it&#39;ll be around for a while, as entire generations of collaborative, work-group applications and services have been built on top of its messaging protocol. For VoIP, <a href="http://skype.com/helloagain.html" target="_blank">Skype</a> is clearly the leading standard todayÂthough one could <a href="http://socialsoftware.weblogsinc.com/entry/1234000923058521/" target="_blank">argue just how &quot;open&quot; it is</a> (and defenders of the IETF&#39;s <a href="http://www.cs.columbia.edu/sip/" target="_blank">SIP standard</a> often do). But it is free and user-friendly, so there won&#39;t be much argument from <i>users</i>Â  about it being insufficiently open. Yet there may be a cloud on Skype&#39;s horizon: web behemoth Google recently released a beta of <a href="http://www.google.com/talk/developer.html" target="_blank">Google Talk, an IM client committed to open standards</a>. It currently <a href="http://radar.oreilly.com/archives/2005/08/google_talk_rel.html" target="_blank">supports XMPP, and will support SIP</a> for VoIP calls.<br /><br /><b>Movers and Shakers:</b><br /><a href="http://www.jabber.org/people/jer.shtml" target="_blank">Jeremie Miller</a>, <a href="http://www.cs.columbia.edu/~hgs/" target="_blank">Henning Schulzrinne</a>, <a href="http://www.von.com/schedule_eos11114704148.html" target="_blank">Jon Peterson</a>, <a href="http://www.pulver.com/jeff/" target="_blank">Jeff Pulver</a><br /><br /><br /><b>10. Device Management and Control</b><br /><br />To access online content, we&#39;re using more and more devices. BlackBerrys, iPods, Treos, you name it. As the web evolves, more and more different devices will have to communicate with each other to give us the content we want when and where we want it. No-one wants to be dependent on one vendor anymoreÂlike, <a href="http://www.alwayson-network.com/comments.php?id=P9409_0_6_0_C" target="_blank">say, Sony</a>Âfor their laptop, phone, MP3 player, PDA, and digital camera, so that it all works together. We need fully interoperable devices, and the standards to make that work. And to fully make use of how content is moving online content and innovative web services, those standards need to be open.<br /><br /><a href="http://en.wikipedia.org/wiki/Midi" target="_blank">MIDI (musical instrument digital interface)</a>, one of the very first open standards in music, connected disparate vendors&#39; instruments, post-production equipment, and recording devices. But MIDI is limited, and <a href="http://www.oreillynet.com/pub/wlg/8015" target="_blank">MIDI II has been very slow to arrive</a>. Now a new standard for controlling musical devices has emerged: <a href="http://www.cnmat.berkeley.edu/OpenSoundControl/" target="_blank">OSC (Open SoundControl)</a>. This protocol is optimized for modern networking technology and inter-connects music, video and controller devices with &quot;other multimedia devices.&quot; OSC is used by a wide range of developers, and is being taken up in the mainstream MIDI marketplace.<br /><br />Another open-standards-based device management technology is <a href="http://www.zigbee.org" target="_blank">ZigBee</a>, for building wireless intelligence and network monitoring into all kinds of devices. ZigBee is supported by many networking, consumer electronics, and mobile device companies.<br /><br /><br />Â  Â  Â  Â· Â· Â· Â· Â· Â· Â  Â  <br /><br /><b>The Change to Openness</b><br /><br />The rise of open source software and its &quot;<a href="http://www.oreillynet.com/pub/a/oreilly/tim/articles/architecture_of_participation.html" target="_blank">architecture of participation</a>&quot; are completely shaking up the old proprietary-web-services-and-standards approach. Sun MicrosystemsÂwhose proprietary Java standard helped define the Web 1.0Âis opening its Solaris OS and has even announced the apparent paradox of an <a href="http://blogs.zdnet.com/open-source/?p=418" target="_blank">open-source Digital Rights Management</a> system.<br /><br />Today&#39;s incumbents will have to adapt to the new openness of the Web 2.0. If they stick to their <a href="http://www.gartner.com/DisplayDocument?doc_cd=131038" target="_blank">proprietary standards</a>, code, and content, they&#39;ll become the new walled gardensÂplaces users visit briefly to retrieve data and content from enclosed data silos, but not where users &quot;live.&quot; The incumbents&#39; revenue models will have to change. Instead of &quot;owning&quot; their users, users will know they own themselves, and will expect a return on their valuable identity and attention. Instead of being locked into incompatible media formats, users will expect easy access to digital content across many platforms. <br /><br />Yesterday&#39;s web giants and tomorrow&#39;s users will need to find a mutually beneficial new balanceÂbetween open and proprietary, developer and user, hierarchical and horizontal, owned and shared, and compatible and closed. <br /><br /><br /><i>Marc Canter is an active evangelist and developer of open standards. Early in his career, Marc founded MacroMind, which became Macromedia. These days, he is CEO of Broadband Mechanics, a founding member of the Identity Gang and of ourmedia.org. Broadband Mechanics is currently developing the <a href="http://www.alwayson-network.com/comments.php?id=11262_0_1_0_C" target="_blank">GoingOn Network</a> (with the AlwaysOn Network), as well as an open platform for social networking called the PeopleAggregator.</i><br /><br />A version of the above post appears in the Fall 2005 issue of AlwaysOn&#39;s quarterly print blogozine, and ran as <a href="http://www.alwayson-network.com/comments.php?id=12063_0_1_0_C" target="_blank">a four-part series</a> on the AlwaysOn Network website.</td></tr></table><br /><p>(Via <a href="http://marc.blogs.it/">Marc&#39;s Voice</a>.)</p></blockquote>]]></content:encoded>
 </rss:item>
 <rss:item xmlns:rss="http://purl.org/rss/1.0/" rdf:about="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2005-04-26#810">
  <rss:title>WebDAV, SQLX, and my Weblog</rss:title>
  <dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2005-04-26T03:54:43Z</dc:date>
  <dc:description xmlns:dc="http://purl.org/dc/elements/1.1/">Uche Ogbuji comments in his blog about the use of WebDAV and SQLX in my blog as part of his commentary about Pyblosxom &amp; WebDAV. To provide some clarity about Virtuoso and Blogging I have decided to put out this quick step by guide to the workings of my blog (there is a long overdue technical white paper nearing completion that address this subject in more detail). Here goes: Blog Editing I can use any editor that supports the following Blog Post APIs: - Moveable Type - Meta Weblog - Blogger Typically I use Virtuoso (which has an unreleased WYSIWYG blog post editor), Newzcrawler, ecto, Zempt, or w.bloggar for my posts. If a post is of interest to me, or relevant to our company or customers I tend to perform one of the following tasks: - Generate a post using the &quot;Blog This&quot; feature of my blog editor - Write a new post that was triggered by a previously read post etc. Either way, the posts end up in our company wide blog server that is Virtuoso based (more about this below). The internal blog server automatically categorizes my blog posts, and automagically determines which posts to upstream to other public blogs that I author (e.g http://kidehen.typepad.com ) or co-author (e.g http://www.openlinksw.com/weblogs/uda and http://www.openlinksw.com/weblogs/virtuoso ). I write once and my posts are dispatched conditionally to multiple outlets. RSS/Atom/RDF Aggregation &amp; Reading I discover, subscribe to, and view blog feeds using Newzcrawler (primarily), and from time to time for experimentation and evaluation purposes I use RSS Bandit, FeedDemon, and Bloglines. I am in the process of moving this activity over to Virtuoso completely due to the large number of feeds that I consume on a daily basis (scalability is a bit of a problem with current aggregators). Blog Publishing When you visit my blog you are experiencing the  soon to be released Virtuoso Blog Publishing engine first hand, which is how WebDAV, SQLX, XQuery/XPath, and Free Text etc. come into the mix. Each time I create a post internally, or subscribe to an external feed, the data ends up in Virtuoso&#39;s SQL Engine (this is how we handle some of the obvious scalability challenges associated with large subscription counts). This engine is SQL2000N based, which implies that it can transform SQL to XML on the fly using recent extensions to SQL in the form of SQLX (prior to the emergence of this standard we used the FOR XML SQL syntax extensions for the same result). It also has its own in-built XSLT processor (DB Engine resident), and validating XML parser (with support for XML Schema).  Thus, my RSS/RDF/Atom archives, FOAF, BlogRoll, OPML, and OCS blog syndication gems are all live examples of SQLX documents that leverage Virtuoso&#39;s WebDAV engine for exposure to Blog Clients. Blog Search When you search for blog posts using the basic or advanced search features of my blog, you end up interacting with one of the following methods of querying data hosted in Virtuoso: Free Text Search, XPath, or XQuery. The result sets produced by the search feature uses SQLX to produce subscription gems (RSS/Atom/RDF/ blog home page exists as a result of Virtuoso&#39;s Virtual Domain / Multi-Homing Web Server functionality. The entire site resides in an Object Relational DBMS, and I can take my DB file across Windows, Solaris, Linux, Mac OS X, FreeBSD, AIX, HP-UX, IRIX, and SCO UnixWare without missing a single beat! All I have to do is instantiate my Virtuoso server and my weblog is live.</dc:description>
  <content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<p>Uche Ogbuji <a href="http://copia.ogbuji.net/blog/2005/04/24#Posting_to">comments</a> in his <a href="http://copia.ogbuji.net/blog">blog</a> about the use of WebDAV and <a href="http://www.tbradford.org/2005/02/xml-with-virtuoso-and-sqlx_02.html">SQLX </a>in my blog as part of his commentary about <a href="http://egaumer.pagecache.org/PyBlosxom/pyblosxom-webdav.html">Pyblosxom &amp; WebDAV</a>. To provide some clarity about Virtuoso and Blogging I have decided to put out this quick step by guide to the workings of my blog (there is a long overdue technical white paper nearing completion that address this subject in more detail).</p>
<p>Here goes:</p>
<p><u><strong>Blog Editing</strong></u></p>
<p>I can use any editor that supports the following Blog Post APIs:</p>
<p>- Moveable Type</p>
<p>- Meta Weblog</p>
<p>- Blogger</p>
<p>Typically I use Virtuoso (which has an unreleased&nbsp;WYSIWYG blog post editor), <a href="http://www.newzcrawler.com/">Newzcrawler</a>, <a href="http://ecto.kung-foo.tv/">ecto</a>, <a href="http://zempt.com/">Zempt</a>, or <a href="http://www.wbloggar.com/">w.bloggar</a> for my posts. If a post is of interest to me, or relevant to our company or customers&nbsp;I tend to perform one of the following tasks:</p>
<p>- Generate a post using the "Blog This" feature of my blog editor</p>
<p>-&nbsp;Write a new post that was triggered by a previously read post etc.</p>
<p>Either way, the posts end up in our company wide blog server that is Virtuoso based (more about this below). The internal blog server automatically categorizes my blog posts, and automagically determines which posts to upstream to other public blogs that I author (e.g <a href="http://kidehen.typepad.com/">http://kidehen.typepad.com</a> ) or co-author (e.g <a href="http://www.openlinksw.com/weblogs/uda">http://www.openlinksw.com/weblogs/uda</a> and <a href="http://www.openlinksw.com/weblogs/virtuoso">http://www.openlinksw.com/weblogs/virtuoso</a> ). I write once and my posts are dispatched conditionally to multiple outlets.</p>
<p><strong><u>RSS/Atom/RDF Aggregation &amp; Reading</u></strong></p>
<p>I discover, subscribe to, and&nbsp;view blog feeds using <a href="http://www.newzcrawler.com/">Newzcrawler</a> (primarily), and from time to time for experimentation and evaluation purposes I use <a href="http://www.rssbandit.org/">RSS Bandit</a>,&nbsp;<a href="http://www.bradsoft.com/feeddemon/">FeedDemon</a>, and <a href="http://www.bloglines.com/">Bloglines</a>. I am in the process of moving this activity over to Virtuoso completely due to the large number of feeds that I consume on a daily basis (scalability is a bit of a problem with current aggregators).</p>
<p><u><strong>Blog Publishing</strong></u></p>
<p>When you visit my blog you are experiencing the&nbsp; soon to be released Virtuoso Blog Publishing engine first hand, which is how&nbsp;WebDAV, SQLX, XQuery/XPath, and Free Text etc. come into the mix.</p>
<p>Each time I create a post internally, or subscribe to an external feed, the data ends up in Virtuoso's SQL Engine (this is how we handle some of the obvious scalability challenges associated with large subscription counts). This engine is SQL2000N based, which implies that it can transform SQL to XML on the fly using recent extensions to SQL in the form of SQLX (prior to the emergence of this standard we used the FOR XML SQL syntax extensions for the same result). It also has its own in-built XSLT processor (DB Engine&nbsp;resident), and validating XML parser (with support for XML Schema).&nbsp; Thus, my <a href="http://www.openlinksw.com/blog/~kidehen/gems/">RSS/RDF/Atom archives, FOAF, BlogRoll, OPML, and OCS</a> blog syndication gems are all live examples of SQLX documents that leverage Virtuoso's WebDAV engine for exposure to&nbsp;Blog Clients.</p>
<p><strong><u>Blog Search</u></strong></p>
<p>When you search for blog posts using the basic or <a href="http://www.openlinksw.com/blog/search.vspx?blogid=127">advanced search</a> features of my blog, you end up interacting with one of the following methods of querying data hosted in Virtuoso: Free Text Search, XPath, or XQuery. The <a href="http://www.openlinksw.com/blog/search.vspx?blogid=127&q=virtuoso&type=text&output=html">result sets</a> produced by the search feature uses SQLX to produce subscription gems (<a href="http://www.openlinksw.com/blog/search.vspx?blogid=127&q=virtuoso&type=text&output=xml">RSS</a>/<a href="http://www.openlinksw.com/blog/search.vspx?blogid=127&q=virtuoso&type=text&output=atom">Atom</a>/<a href="http://www.openlinksw.com/blog/search.vspx?blogid=127&q=virtuoso&type=text&output=rdf">RDF</a>/<a href="http://www.openlinksw.com/blog/search.vspx?blogid=127&type=text&kwds=virtuoso&OpenSearch">OpenSearch</a>) and <a href="http://www.openlinksw.com/blog/search.vspx?blogid=127&q=virtuoso&type=text&output=html">URIs</a> that enable dynamic tracking of my posts using your search keywords.</p>
<p>BTW - the <a href="http://www.openlinksw.com/blog/~kidehen">http://www.openlinksw.com/blog/~kidehen</a> blog home page exists as a result of Virtuoso's Virtual Domain / Multi-Homing Web Server functionality. The entire site resides in an Object Relational DBMS, and I can take my DB file across Windows, Solaris, Linux, Mac OS X, FreeBSD, AIX, HP-UX, IRIX, and SCO UnixWare without missing a single beat! All I have to do is instantiate my Virtuoso server and my weblog is live.</p>]]></content:encoded>
 </rss:item>
 <rss:item xmlns:rss="http://purl.org/rss/1.0/" rdf:about="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2005-04-21#793">
  <rss:title>Mac OS X and its potential impact on Windows</rss:title>
  <dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2005-04-21T20:25:16Z</dc:date>
  <dc:description xmlns:dc="http://purl.org/dc/elements/1.1/">We are at an interesting crossroads in the computer industry (IMHO) . Apple is about to unleash Tiger (ETA: one week from now), and this operating system release could end up being the crucial round of the titanic battle between Apple and Microsoft. The battle which starts at the Operating System level reminds me of the &quot;Rumble In The Jungle&quot; (circa. 1974, Kinshasa, Zaire); Apple in the role of Ali (aka &quot;The Greatest&quot; who was the overwhelming underdog at time) and Microsoft in the role of George Foreman (who at the time was logically invincible). The shakesperian tale of Macbeth also comes to mind as depicted in the excerpt below: &quot;.... Macbeth goes to visit the witches in their cavern. There, they show him a sequence of demons and spirits who present him with further prophecies: he must beware of Macduff, a Scottish nobleman who opposed Macbeth&#39;s accession to the throne; he is incapable of being harmed by any man born of woman; and he will be safe until Birnam Wood comes to Dunsinane Castle. &quot; Having used all the major operating systems on a serious basis for a number of years in a variety of modes; user, developer, and administrator. I have always felt that a RISC based UNIX operating system (of BSD genealogical branch extraction), if somehow combined with a user interface that is superior to Windows, would ultimately unravel the Windows Desktop Monopoly. That operating system exists today in the form of Mac OS X (its lastest Tiger release simply kicks the differential up a notch). Back to the Macbeth correlation: &quot;Birnam Woods coming to Dunsinane&quot; is the metaphoric equivalent of desktop users and first time computer users being forced (by the scourge of virus and spyware) to revaluate Windows as the only choice for productive desktop computing. What would you recommend to &quot;Aunt Milly&quot; when she tells you she wants to get on the Internet? Especially if &quot;Aunt Milly&quot; isn&#39;t living with you? &quot;Man not born of a woman&quot; is no different to saying: UNIX with a superior user interface to Windows! I don&#39;t think you need me to tell who play the characters of Macbeth and Macduff in this drama :-) The Windows security vulnerabilities quagmire (google juice on this phrase is currently 6,620 pages) has basically created an inflection of monumental proportions adversely affecting Windows and creating great visibility and evaluation building opportunities for Mac OS X (&quot;once users experience a Mac they don&#39;t come back to Windows!&quot;). Paul Murphy of cio-today.com has also written a great article sheds light on the often overlooked hardware aspect to the security problem for Windows Here is a poignant excerpt: Software and Hardware Vulnerabilities At present, attacks on Microsoft&#39;s Windows products are generally drawn from a different population of possible attacks than those on Unix variants such as BSD, Linux and Solaris. From a practical perspective, the key difference is that attacks on Wintel tend to have two parts: A software vulnerability is exploited to give a remote attacker access to the x86 hardware and that access is then used to gain control of the machine. In contrast, attacks on Unix generally require some form of initial legal access to the machine and focus on finding software ways to upgrade priveleges illegally. Consider, for example, CAN-2004-1134 in the NIST vulnerabilities database: Summary: Buffer overflow in the Microsoft W3Who ISAPI (w3who.dll) allows remote attackers to cause a denial of service and possibly execute arbitrary code via a long query string. Published Before: 1/10/2005 Severity: High The vulnerability exists in Microsoft&#39;s code, but the exploit depends on the rigid stack-order execution and limited page protection inherent in the x86 architecture. If Windows ran on Risc, that vulnerability would still exist, but it would be a non-issue because the exploit opportunity would be more theoretical than practical. Linux and open-source applications are thought to have far fewer software vulnerabilities than Microsoft&#39;s products, but Linux on Intel (Nasdaq: INTC - news) is susceptible to the same kind of attacks as those now predominantly affecting Wintel users. For real long-term security improvements, therefore, the right answer is to look at Linux, or any other Unix, on non x86 hardware. One such option is provided by Apple&#39;s (Nasdaq: AAPL - news) BSD-based products on the PowerPC-derived G4 and G5 CPUs. Linus Torvalds, for example, apparently now runs Linux on a Mac G5 and there are several Linux distributions for this hardware -- all of which are immune to the typical x86-oriented exploit. This may even been the nullifier of that age old argument about porting Mac OS X to the x86 in order to broaden its adoption potential? Mac OS X is certainly a breath of fresh air for anyone who needs to simply get stuff done with their desktops and notebooks.</dc:description>
  <content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<p dir="ltr">We are at an interesting crossroads in the computer industry (IMHO) . Apple is about to unleash <a href="http://www.apple.com/macosx/">Tiger</a> (ETA: one week from now), and this operating system release could end up being the crucial round of the titanic battle between Apple and Microsoft. The battle which starts&nbsp;at the Operating System level reminds me of the&nbsp;"<a href="http://home.sandiego.edu/~murphy2/jungle.html">Rumble In The Jungle</a>" (circa. 1974, <a href="http://www.answers.com/main/ntquery?s=Kinshasa&method=2&gwp=13">Kinshasa</a>, <a href="http://www.answers.com/topic/congo-country-zaire&method=6">Zaire</a>); Apple in the role of <a href="http://www.answers.com/topic/muhammad-ali-boxer&method=6">Ali</a> (aka "The Greatest" who was the overwhelming underdog at time) and Microsoft in the role of <a href="http://www.answers.com/topic/george-foreman&method=6">George Foreman</a> (who at the time was logically invincible). </p>
<p dir="ltr">The shakesperian tale of Macbeth also comes to mind as depicted in the excerpt below:</p>
<blockquote dir="ltr" style="MARGIN-RIGHT: 0px">
<p dir="ltr">".... Macbeth goes to visit the witches in their cavern. There, they show him a sequence of demons and spirits who present him with further prophecies: he must beware of Macduff, a Scottish nobleman who opposed Macbeth's accession to the throne; he is incapable of being harmed by any man born of woman; and he will be safe until Birnam Wood comes to Dunsinane Castle. "</p></blockquote>
<p dir="ltr">Having used all the major operating systems on a serious basis for a number of years in a variety of&nbsp;modes;&nbsp;user, developer, and administrator. I have always felt that a RISC based UNIX operating system (of BSD genealogical branch extraction), if somehow combined with a user interface that is superior to Windows,&nbsp;would ultimately&nbsp;unravel the Windows Desktop Monopoly. That&nbsp;operating system exists today in the form of Mac OS X (its lastest Tiger release simply <a href="http://www.apple.com/macosx/newfeatures/">kicks the differential up a notch</a>). </p>
<p dir="ltr">Back to the Macbeth correlation:</p>
<blockquote dir="ltr" style="MARGIN-RIGHT: 0px">
<p dir="ltr"><u>"Birnam Woods coming to Dunsinane"</u> is the metaphoric equivalent of desktop users and first time computer users being forced (by the scourge of virus and spyware) to revaluate Windows as the only choice for productive desktop computing. What would you recommend to "Aunt Milly" when she tells you she wants to get on the Internet? Especially if "Aunt Milly" isn't living with you?</p>
<p dir="ltr">"<u>Man not born of a woman"</u> is no different to saying: UNIX with a superior user interface to Windows!</p>
<p dir="ltr">I don't think you need me to tell who play the characters of Macbeth and Macduff in this drama :-)</p></blockquote>
<p dir="ltr">The Windows security vulnerabilities quagmire (<a href="http://www.google.com/search?q=Windows+security+vulnerabilities+quagmire&sourceid=mozilla-search&start=0&start=0&ie=utf-8&oe=utf-8&client=firefox-a&rls=org.mozilla:en-US:official">google juice</a> on this phrase is currently 6,620 pages)&nbsp;has basically created an inflection of monumental proportions adversely affecting Windows and creating great visibility and evaluation building opportunities for Mac OS X ("once users&nbsp;experience a&nbsp;Mac they don't come back to Windows!").</p>
<p dir="ltr">Paul Murphy of <a href="http://www.cio-today.com/">cio-today.com</a>&nbsp;has also written a great article&nbsp;sheds light on the&nbsp;often overlooked hardware aspect to the security problem for Windows&nbsp;Here is a poignant excerpt:</p>
<blockquote dir="ltr" style="MARGIN-RIGHT: 0px">
<p><font face="arial" size="-1"><b>Software and Hardware Vulnerabilities</b> </font></p>
<p><font face="arial" size="-1"></font></p>
<p><font face="arial" size="-1">At present, attacks on Microsoft's Windows products are generally drawn from a different population of possible attacks than those on <span class="keyword"><a href="http://us.rd.yahoo.com/DailyNews/manual/nf/bs_nf/33272/14945921/*http://news.search.yahoo.com/search/news?fr=news-storylinks&p=%22Unix%22&c=&n=20&yn=c&c=news&cs=nw">Unix</a></span> variants such as BSD, Linux and Solaris. From a practical perspective, the key difference is that attacks on Wintel tend to have two parts: A software vulnerability is exploited to give a remote attacker access to the x86 hardware and that access is then used to gain control of the machine. </font></p>
<p><font face="arial" size="-1"></font></p>
<p><font face="arial" size="-1">In contrast, attacks on Unix generally require some form of initial legal access to the machine and focus on finding software ways to upgrade priveleges illegally. </font></p>
<p><font face="arial" size="-1"></font></p>
<p><font face="arial" size="-1">Consider, for example, CAN-2004-1134 in the NIST vulnerabilities database: </font></p>
<p><font face="arial" size="-1"></font></p>
<p><font face="arial" size="-1">Summary: Buffer overflow in the Microsoft W3Who ISAPI (w3who.dll) allows remote attackers to cause a denial of service and possibly execute arbitrary code via a long query string. </font></p>
<p><font face="arial" size="-1"></font></p>
<p><font face="arial" size="-1">Published Before: 1/10/2005 </font></p>
<p><font face="arial" size="-1"></font></p>
<p><font face="arial" size="-1">Severity: High </font></p>
<p><font face="arial" size="-1"></font></p>
<p><font face="arial" size="-1">The vulnerability exists in Microsoft's code, but the exploit depends on the rigid stack-order execution and limited page protection inherent in the x86 architecture. If Windows ran on Risc, that vulnerability would still exist, but it would be a non-issue because the exploit opportunity would be more theoretical than practical. </font></p>
<p><font face="arial" size="-1"></font></p>
<p><font face="arial" size="-1">Linux and open-source applications are thought to have far fewer software vulnerabilities than Microsoft's products, but Linux on Intel (<a href="http://us.rd.yahoo.com/dailynews/finance/nf/bs_nf/storytext/33272/14945921/*http://finance.yahoo.com/q?s=intc&d=t">Nasdaq: INTC</a> - <a href="http://us.rd.yahoo.com/dailynews/biz/nf/bs_nf/storytext/33272/14945921/*http://biz.yahoo.com/n/i/intc.html">news</a>) is susceptible to the same kind of attacks as those now predominantly affecting Wintel users. For real long-term security improvements, therefore, the right answer is to look at Linux, or any other Unix, on non x86 hardware. </font></p>
<p><font face="arial" size="-1"></font></p>
<p><font face="arial" size="-1">One such option is provided by Apple's (<a href="http://us.rd.yahoo.com/dailynews/finance/nf/bs_nf/storytext/33272/14945921/*http://finance.yahoo.com/q?s=aapl&d=t">Nasdaq: AAPL</a> - <a href="http://us.rd.yahoo.com/dailynews/biz/nf/bs_nf/storytext/33272/14945921/*http://biz.yahoo.com/n/a/aapl.html">news</a>) BSD-based products on the PowerPC-derived G4 and G5 CPUs. <span class="keyword"><a href="http://us.rd.yahoo.com/DailyNews/manual/nf/bs_nf/33272/14945921/*http://news.search.yahoo.com/search/news?fr=news-storylinks&p=%22Linus%20Torvalds%22&c=&n=20&yn=c&c=news&cs=nw">Linus Torvalds</a></span>, for example, apparently now runs Linux on a Mac G5 and there are several Linux distributions for this hardware -- all of which are immune to the typical x86-oriented exploit. </font></p></blockquote>
<p dir="ltr">This may even been the nullifier of that age old argument about porting Mac OS X to the x86 in order to broaden its adoption potential?</p>
<p dir="ltr">Mac OS X is certainly a breath of fresh air for anyone who needs to simply get stuff&nbsp;done with their&nbsp;desktops and notebooks. </p>]]></content:encoded>
 </rss:item>
 <rss:item xmlns:rss="http://purl.org/rss/1.0/" rdf:about="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2005-03-26#766">
  <rss:title>Back To The Future: Hypermedia</rss:title>
  <dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2005-03-26T20:24:30Z</dc:date>
  <dc:description xmlns:dc="http://purl.org/dc/elements/1.1/">If a picture speaks a thousand words, I sometimes wonder how many words we attribute to a multimedia clip? Especially one that is now openly accessible to many who don&#39;t quite understand the high degree of: &quot;Back To The Future&quot; quotient of most of what we see today. The Internet Archive initiative is building up an amazing collection of content that includes this &quot;must watch&quot; movie about the somewhat forgotten hypercard development environment. As I watched the hypercard movie I obtained clear reassurance that my vision of Web 2.0 as critical infrastructure for a future Semantic Web isn&#39;t unfounded. The solution building methodology espoused by hypercard is exactly how Semantic Web applications will be built, and this will be done by orchestrating the componentary of Web 2.0. When watching this clip make the following mental adjustments: Swap hypercard stacks for discrete and/or composite services that have published endpoints exposed by Web 2.0 points of presence Think of information taking the form of XML based content e.g. RSS, Atom, RDF, FOAF, XFN, and other future XML based data contextualization formats; all accessible via URIs When the Apple Mac operating system is mentioned (or infered) think of the Internet (you don&#39;t need Windows, Mac OS, Linux, UNIX etc. to realize the vision, the network provided by the Internet is the Operating System) When the Apple computer is mentioned simply think about a plethora of function specific devices (computers, mobile phones, PDAs etc.) that overtly or covertly provide conduits to the new operating environment (the Internet) As you hear term &quot;whole new body of people that are non programmers contributing there ideas&quot; think about yourself and the increasing ease of participation that&#39;s beginning to take shape in this emerging frontier! As for &quot;Whole Earth Catalog&quot;, think Wikipedia or more recent efforts such as Answers.com. Web 2.0 is a reflection of the web taking its first major step out of the technology stone age (certainly the case relative to the hypercard movie and &quot;pre web&quot; application development in general).  </dc:description>
  <content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<p>If a picture speaks a thousand words, I sometimes wonder how many words we attribute to a multimedia clip? Especially one that is now openly accessible to many who don't quite understand the high degree of: "Back To The Future" quotient of most of what we see today.</p>
<p>The Internet&nbsp;Archive initiative is building up an amazing&nbsp;collection of content&nbsp;that includes this <a href="http://www.archive.org/movies/details-db.php?collection=computerchronicles&collectionid=CC501_hypercard">"must watch" movie</a> about the somewhat forgotten <a href="http://en.wikipedia.org/wiki/Hypercard">hypercard</a> development environment.</p>
<p>As I watched the hypercard movie I obtained clear reassurance that my vision of <a href="http://en.wikipedia.org/wiki/Web_2.0">Web 2.0</a> as critical infrastructure for a future Semantic Web isn't unfounded. The solution building methodology espoused by hypercard is exactly how Semantic Web applications will be built, and this will be done by orchestrating&nbsp;the componentary of Web 2.0.</p>
<p>When watching this clip make the following mental adjustments:</p>
<ol>
<li>Swap hypercard stacks for discrete and/or composite services that have published endpoints exposed by Web 2.0 points of presence<br><br></li>
<li>Think of information taking the form of XML based content e.g. RSS, Atom, RDF, FOAF, XFN, and other future&nbsp;XML based data contextualization&nbsp;formats; all accessible via URIs<br><br></li>
<li>When the Apple Mac operating system is mentioned (or infered) think of the Internet&nbsp;(you don't need Windows, Mac OS, Linux,&nbsp;UNIX etc.&nbsp;to realize the vision, the network provided by the Internet&nbsp;is the Operating System)<br><br></li>
<li>When the Apple computer is mentioned simply think about a plethora of function specific devices (computers, mobile phones, PDAs etc.) that overtly or covertly provide conduits to the new operating environment (the Internet)<br><br></li>
<li>As you hear term "whole new body of people that are non programmers contributing there ideas" think about yourself and the increasing ease of participation&nbsp;that's beginning to take shape in this&nbsp;emerging frontier!<br><br></li>
<li>As for "<a href="http://www.wholeearthmag.com/about.html">Whole Earth Catalog", </a>think <a href="http://en.wikipedia.org">Wikipedia</a>&nbsp;or more recent efforts such as <a href="http://www.answers.com">Answers.com</a>.</li></ol>
<p>Web 2.0 is a reflection of the web taking its first major step out of the technology stone age (certainly the case relative to the hypercard movie and "pre web" application development in general). </p>
<p>&nbsp;</p>]]></content:encoded>
 </rss:item>
 <rss:item xmlns:rss="http://purl.org/rss/1.0/" rdf:about="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2005-02-23#691">
  <rss:title>Novell&#39;s Response to NT4 support discontinuation</rss:title>
  <dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2005-02-23T15:08:31Z</dc:date>
  <dc:description xmlns:dc="http://purl.org/dc/elements/1.1/">Pretty funny piece from Novell.</dc:description>
  <content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[Pretty funny <a href="http://www.novell.com/linux/windowstolinux/publicservice/">piece</a> from Novell.]]></content:encoded>
 </rss:item>
 <rss:item xmlns:rss="http://purl.org/rss/1.0/" rdf:about="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2004-11-19#642">
  <rss:title>MacSOS Releases SyBrowser 6.2</rss:title>
  <dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2004-11-19T17:40:38Z</dc:date>
  <dc:description xmlns:dc="http://purl.org/dc/elements/1.1/">MacSOS Releases SyBrowser 6.2 Dr. Gerard Hammond of MacSOS announced the release of SyBrowser 6.2, a Macintosh application that can query Sybase, FrontBase, PostgreSQL, Oracle, ODBC and MS SQL databases hosted on OSX, UNIX, Linux, and Windows servers. SyBrowser v6.2 features include: - Added FrontBase database support. - Added &quot;Bachman&quot; style ERD features (Tridents for &#39;Many&#39; arms of a relationship, open circles for optional entities) - The arms of a relationship now track their entities correctly in all directions. - The arm of the selected relationship can be moved using the mouse or the keyboard - Fixed bug with SQL auto-completion popup with multiple monitors. - Enhanced the &quot;Edit Relationships Info...&quot; dialog. This dialog allows the properties of the selected relationship to be edited. - The mouse cursor changes to reflect the draggable direction when resizing ERD tables, or dragging the various arms of a relationship. The selected arm of the selected relationship now has a circle for a handle. - Documentation added. - Printing the ERD panel has been improved. - The Find dialog allows searching the returned datasets on the SQL panel and Results windows as well as the code in Sybase stored procedures. SyBrowser Overview SyBrowser is a table browser and alternative &quot;isql&quot; client for Sybase databases. It facilitates SQL generation thorough a point and click interface. SyBrowser also provides an overview of the tables in ODBC, MySQL, Oracle, FrontBase, PostgreSQL and MS SQL databases. Complex queries can be saved to disk for reuse. An ERD module allows the creation of visual representations of data models. $89 Shareware from MacSOS, Australia $49 upgrade from any previous version http://www.macsos.com.au [via RB Garage News Feed]</dc:description>
  <content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<a href="http://feeds.feedburner.com/rbgarage?m=93">MacSOS Releases SyBrowser 6.2</a> 
<div xmlns="http://www.w3.org/1999/xhtml">Dr. Gerard Hammond of MacSOS announced the release of SyBrowser 6.2, a Macintosh application that can query Sybase, FrontBase, PostgreSQL, Oracle, ODBC and MS SQL databases hosted on OSX, UNIX, Linux, and Windows servers. <br><br>SyBrowser v6.2 features include: <br><br>- Added FrontBase database support. <br>- Added "Bachman" style ERD features (Tridents for 'Many' arms of a relationship, open circles for optional entities) <br>- The arms of a relationship now track their entities correctly in all directions. <br>- The arm of the selected relationship can be moved using the mouse or the keyboard <br>- Fixed bug with SQL auto-completion popup with multiple monitors. <br>- Enhanced the "Edit Relationships Info..." dialog. This dialog allows the properties of the selected relationship to be edited. <br>- The mouse cursor changes to reflect the draggable direction when resizing ERD tables, or dragging the various arms of a relationship. The selected arm of the selected relationship now has a circle for a handle. <br>- Documentation added. <br>- Printing the ERD panel has been improved. <br>- The Find dialog allows searching the returned datasets on the SQL panel and Results windows as well as the code in Sybase stored procedures. <br><br>SyBrowser Overview <br>SyBrowser is a table browser and alternative "isql" client for Sybase databases. It facilitates SQL generation thorough a point and click interface. SyBrowser also provides an overview of the tables in ODBC, MySQL, Oracle, FrontBase, PostgreSQL and MS SQL databases. Complex queries can be saved to disk for reuse. An ERD module allows the creation of visual representations of data models. <br><br>$89 Shareware from MacSOS, Australia <br>$49 upgrade from any previous version <br><br><a href="http://www.macsos.com.au/">http://www.macsos.com.au</a> </div>
<div align="right">[via <a href="http://rbgarage.blogspot.com/">RB Garage News Feed</a>]</div>]]></content:encoded>
 </rss:item>
 <rss:item xmlns:rss="http://purl.org/rss/1.0/" rdf:about="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2004-06-17#562">
  <rss:title>Mozilla and Opera Renew the Browser Battle</rss:title>
  <dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2004-06-17T22:04:41Z</dc:date>
  <dc:description xmlns:dc="http://purl.org/dc/elements/1.1/">By Kendall Grant Clark, XML.com I now find myself with a wealth of choices, not only on OS X -- where I use a freewheeling mixture of Mozilla, Safari, and Firefox daily -- but also on Linux. Windows users who continue to use Internet Explorer fall into one of several camps: they either don&#39;t know or don&#39;t care about web standards and compliance thereto; or they can&#39;t tell the difference between a bloated piece of software and a quality piece of software; or they can tell, but that difference is of no importance to them. If they don&#39;t know or care about IE&#39;s many defects, why should I? Because there are so many of them! In the ideal world technology standards would unify, rationalize, and perhaps create new markets. While this kind of positive benefit is sometimes achieved by bodies like ISO, W3C, and OASIS, in the real world, given Microsoft&#39;s total domination of desktop computing, that its browser does not excel ends up being not only a pain for users but also a pain for developers and publishers. http://www.xml.com/pub/a/2004/06/16/deviant.html</dc:description>
  <content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<font size="2">
<p>By Kendall Grant Clark, <a href="http://www.xml.com">XML.com</a></p>
<p>I now find myself with a wealth of choices, not only on OS X -- where I use a freewheeling mixture of Mozilla, Safari, and Firefox daily -- but also on Linux. Windows users who continue to use Internet Explorer fall into one of several camps: they either don&#39;t know or don&#39;t care about web standards and compliance thereto; or they can&#39;t tell the difference between a bloated piece of software and a quality piece of software; or they can tell, but that difference is of no importance to them. If they don&#39;t know or care about IE&#39;s many defects, why should I? Because there are so many of them! In the ideal world technology standards would unify, rationalize, and perhaps create new markets. While this kind of positive benefit is sometimes achieved by bodies like ISO, W3C, and OASIS, in the real world, given Microsoft&#39;s total domination of desktop computing, that its browser does not excel ends up being not only a pain for users but also a pain for developers and publishers.</p>
<p><a href="http://www.xml.com/pub/a/2004/06/16/deviant.html"><u><font color="#0000ff" size="2">http://www.xml.com/pub/a/2004/06/16/deviant.html</font></u></a></p></font>]]></content:encoded>
 </rss:item>
 <rss:item xmlns:rss="http://purl.org/rss/1.0/" rdf:about="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2004-05-27#552">
  <rss:title>Open Source PABX System + P2P VOIP (musings)</rss:title>
  <dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2004-05-28T01:17:16Z</dc:date>
  <dc:description xmlns:dc="http://purl.org/dc/elements/1.1/">Asterisk (discovered via this Jon Udell post) is a complete PBX in software. It runs on Linux and provides all of the features you would expect from a PBX and more. Quoting from the Asterisk home page: Asterisk does voice over IP in three protocols, and can interoperate with almost all standards-based telephony equipment using relatively inexpensive hardware. Asterisk provides Voicemail services with Directory, Call Conferencing, Interactive Voice Response, Call Queuing. It has support for three-way calling, caller ID services, ADSI, SIP and H.323 (as both client and gateway). Check the Features section for a more complete list. Naturally, this got me thinking about Skype; could Asterik and Skpe be meshed into something out of this world (Sykype, WiFi, and Asterisk)? But Skype isn&#39;t Open Source, so this would have to be something the Skype team would want to embark upon I guess? As I pondered I searched further, and stumbled across this Open Source competitor of</dc:description>
  <content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<p><a href="http://www.asterisk.org/">Asterisk</a> (discovered via <a href="http://weblog.infoworld.com/udell/2004/05/26.html#a1009">this</a> Jon Udell post) is a complete PBX in software. It runs on Linux and provides all of the features you would expect from a PBX and more. </p>
<p>Quoting from the Asterisk home page:</p>
<blockquote dir="ltr" style="MARGIN-RIGHT: 0px">
<p>Asterisk does voice over IP in three protocols, and can interoperate with almost all standards-based telephony equipment using relatively inexpensive hardware. </p>
<p>Asterisk provides Voicemail services with Directory, Call Conferencing, Interactive Voice Response, Call Queuing. It has support for three-way calling, caller ID services, ADSI, SIP and H.323 (as both client and gateway). </p>
<p>Check the <a href="http://www.asterisk.org/index.php?menu=features">Features</a> section for a more complete list.</p></blockquote>
<p>Naturally, this got me thinking about Skype; could Asterik and Skpe be meshed into something out of this world (Sykype, WiFi, and Asterisk)? But Skype isn&#39;t Open Source, so this would have to be something the Skype team would want to embark upon I guess? </p>
<p>As I pondered I searched further, and stumbled across this Open Source competitor of</p>]]></content:encoded>
 </rss:item>
 <rss:item xmlns:rss="http://purl.org/rss/1.0/" rdf:about="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2004-05-14#543">
  <rss:title>Collaboration Software</rss:title>
  <dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2004-05-14T23:39:35Z</dc:date>
  <dc:description xmlns:dc="http://purl.org/dc/elements/1.1/">Dare Obasanjo points out that Microsoft Sharepoint offers &quot;by reference&quot; as opposed to &quot;by value&quot; mail attachment capability that Jon UdellÂ reviewedÂ in a recent blog post,Â true! So does Virtuoso in a number of ways (most importantly independent ofÂ client or serverÂ operating system). This issue really brings WebDAV into scope as this is the protocol that enables this capability (as covered by Jon&#39;s piece), and it is one of the many client and server side protocols implemented by OpenLink VirtuosoÂ (the key to how Virtuoso delivers URI based SQL-XML, XQuery, XPathÂ services). When you install Virtuoso you simply have to start the Virtuoso server instanceÂ to the get WebDAV functionality going. All of Virtuoso&#39;s services are advertised at ports, and in the case of WebDAV you will find this at port 8890 if you start the demo database. To exploit the Virtuoso/WebDAV server from any WebDAV client (or point urls at WebDAV hosted resources) simply do the following: Install Virtuoso and depending on your OS do the following: Windows - create a Web Folder that points to a WebDAV server Mac OS X - mount a WebDAV folder Linux - mount a WebDAV directoryÂ (also see the Davfs2 Open Source project) You can also make WebDAV client calls from Virtuoso&#39;s Stored Procedure Language (Virtuoso PL) or use WebDAV implementations in any development environment of your choice (.NET, Java, . Place content that you want to reference in your mails in your WebDAV repository via any of the client side mechanisms described in step 1. You can see the results of this in my earlier blog post, even better pass the url on in an email! Or browse the WebDAV folder (there are some nuggets deliberately left in place :-) ) You could simply save an Office Doc (powerpoint, excel, word etc)Â to this location and the circulate urls in your mails (this has been standard practice at OpenLink for many years; we even have a full blown portal server that would soon be available as a public service to sharing anything via DAV and as usual some more... stay tuned) That&#39;s it for any platform (Windows, Linux, Mac OS X, FreeBSD, Solaris, AIX, HP-UX etc.) once you install Virtuoso! BTW - This blog is WebDAV based (it&#39;s a live instance of Virtuoso doing many things; WebDAV, HTTP, SQL-XML based feed generation for ATOM, RSS, Blog Post APIs support (Moveable Type, Metaweblog, Blogger, ATOM), Free Text, XPath, XQuery, and more).Â </dc:description>
  <content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<p dir="ltr"><a href="http://www.25hoursaday.com/weblog/PermaLink.aspx?guid=d2312299-0c0d-497b-9268-4b124f61f801">Dare Obasanjo</a> points out that Microsoft Sharepoint offers &quot;by reference&quot; as opposed to &quot;by value&quot; mail attachment capability that <a href="http://www.infoworld.com/article/04/02/27/09TCxythos_1.html">Jon UdellÂ reviewedÂ </a>in a recent blog post,Â true! So does Virtuoso in a number of ways (most importantly independent ofÂ client or serverÂ operating system).</p>
<p dir="ltr">This issue really brings WebDAV into scope as this is the protocol that enables this capability (as covered by Jon&#39;s piece), and it is one of the many client and server side protocols implemented by <a href="http://www.openlinksw.com/virtuoso/whatis.htm">OpenLink Virtuoso</a>Â (the key to how Virtuoso delivers URI based SQL-XML, XQuery, XPathÂ services). </p>
<p dir="ltr">When you install Virtuoso you simply have to start the Virtuoso server instanceÂ to the get WebDAV functionality going. All of Virtuoso&#39;s services are advertised at ports, and in the case of WebDAV you will find this at port 8890 if you start the demo database. </p>
<p dir="ltr">To exploit the Virtuoso/WebDAV server from any WebDAV client (or point urls at WebDAV hosted resources) simply do the following:</p>
<ol dir="ltr">
<li>
<div>Install Virtuoso and depending on your OS do the following:</div></li>
<ul>
<li>
<div>Windows - create a <a href="http://support.openlinksw.com/support/tutorials.vsp?c=Web+Server">Web Folder </a>that points to a WebDAV server</div></li>
<li>
<div>Mac OS X - <a href="http://developer.apple.com/technotes/tn/tn2043.html">mount a WebDAV</a> folder</div></li>
<li>
<div>Linux - mount a <a href="http://www.sfu.ca/acs/linux/webdav-linux.html">WebDAV directory</a>Â (also see the <a href="http://dav.sourceforge.net/">Davfs2</a> Open Source project)</div></li>
<li>
<div>You can also make WebDAV client calls from Virtuoso&#39;s Stored Procedure Language (Virtuoso PL) or use WebDAV implementations in any development environment of your choice (<a href="http://www.independentsoft.de/webdav/">.NET</a>, <a href="http://sourceforge.net/projects/skunkdav/">Java</a>, .<br /></div></li></ul>
<li>
<div>Place content that you want to reference in your mails in your WebDAV repository via any of the client side mechanisms described in step 1. You can see the results of this in my earlier <a href="http://www.openlinksw.com/weblogs/virtuoso/index.vspx?id=505">blog post</a>, even better pass the <a href="http://kingsleydemo.openlinksw.com:8890/rtmhosting/99bottles.php">url </a>on in an email! Or browse the <a href="http://kingsleydemo.openlinksw.com:8890/rtmhosting/">WebDAV folder </a>(there are some nuggets deliberately left in place :-) )<br /></div></li>
<ul>
<li>
<div>You could simply save an Office Doc (<a href="http://kingsleydemo.openlinksw.com:8890/rtmhosting/webDADWWW2004.ppt">powerpoint</a>, excel, word etc)Â to this location and the circulate urls in your mails (this has been standard practice at OpenLink for many years; we even have a full blown portal server that would soon be available as a public service to sharing anything via DAV and as usual some more... stay tuned)<br /></div></li></ul>
<li>
<div>That&#39;s it for any platform (Windows, Linux, Mac OS X, FreeBSD, Solaris, AIX, HP-UX etc.) once you install Virtuoso!</div></li></ol>
<p>BTW - This blog is WebDAV based (it&#39;s a live instance of Virtuoso doing many things; WebDAV, HTTP, SQL-XML based feed generation for ATOM, RSS, Blog Post APIs support (Moveable Type, Metaweblog, Blogger, ATOM), Free Text, XPath, XQuery, and more).Â  </p>]]></content:encoded>
 </rss:item>
 <rss:item xmlns:rss="http://purl.org/rss/1.0/" rdf:about="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2004-04-30#535">
  <rss:title>GUIs and XML Configuration Data: A Look at the Use of XML in Mac OS X and KDE</rss:title>
  <dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2004-04-30T22:25:43Z</dc:date>
  <dc:description xmlns:dc="http://purl.org/dc/elements/1.1/">David Mertz, IBM developerWorks Over time, XML has permeated many niches. One area where XML is used increasingly is in the configuration of graphical user interfaces, especially in elements that are persistent but should not be fixed at compile-time. In this installment, the author looks at the use of XML in Mac OS X&#39;s Aqua GUI, and in the K Desktop Environment (KDE) which is either standard or available in most modern Linux distributions. So far, the use of XML in configuring modern GUIs is a bit haphazard. Most interfaces use XML in some places, but other mechanisms elsewhere. But it&#39;s clear that the general movement is toward XML. Clearly, Mac OS X Aqua and KDE each have their own XML philosophy. Mac OS X uses solely XML elements that correspond to broad data types, while everything that is really application-specific or GUI-specific is shunted off into the PCDATA content of container elements. In contrast, KDE&#39;s XML feels very usage-specific. http://www-106.ibm.com/developerworks/xml/library/x-matters34.html ----------------------------------------------------------------------</dc:description>
  <content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<font size="2">
<p>David Mertz, IBM developerWorks</p>
<p>Over time, XML has permeated many niches. One area where XML is used increasingly is in the configuration of graphical user interfaces, especially in elements that are persistent but should not be fixed at compile-time. In this installment, the author looks at the use of XML in Mac OS X&#39;s Aqua GUI, and in the K Desktop Environment (KDE) which is either standard or available in most modern Linux distributions. So far, the use of XML in configuring modern GUIs is a bit haphazard. Most interfaces use XML in some places, but other mechanisms elsewhere. But it&#39;s clear that the general movement is toward XML. Clearly, Mac OS X Aqua and KDE each have their own XML philosophy. Mac OS X uses solely XML elements that correspond to broad data types, while everything that is really application-specific or GUI-specific is shunted off into the PCDATA content of container elements. In contrast, KDE&#39;s XML feels very usage-specific.</p>
<p><a href="http://www-106.ibm.com/developerworks/xml/library/x-matters34.html"><u><font color="#0000ff" size="2">http://www-106.ibm.com/developerworks/xml/library/x-matters34.html</font></u></a></p><font size="2">
<p>----------------------------------------------------------------------</p></font></font>]]></content:encoded>
 </rss:item>
 <rss:item xmlns:rss="http://purl.org/rss/1.0/" rdf:about="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2004-04-07#504">
  <rss:title>621 variations of The &quot;99 Bottles of Beer&quot; programming puzzle</rss:title>
  <dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2004-04-07T23:48:39Z</dc:date>
  <dc:description xmlns:dc="http://purl.org/dc/elements/1.1/">621 variations of the &quot;99 Bottles of Beer&quot; programming puzzle implemented across a plethora of programming languages. Cool! As I completed this post a bell went off! Why not use this for a quick live demo of Virtuoso&#39;s hosting capabilities? Starting off with something simple like PHP for instance? So, I quickly did the following: Cut and pasted the PHP version of this programming puzzle into a text file (using notepad) Copy and pasted from my Windows Directory to my Virtuoso WebDAV directories on our Windows and Linux Virtuoso Demo Servers. I achieved this by creating Web Folders (Windows OS level</dc:description>
  <content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<p><a href="http://www.99-bottles-of-beer.net//">621 variations of the &quot;99 Bottles of Beer&quot; programming puzzle</a> implemented across a plethora of programming languages. Cool!</p>
<p>As I completed this post a bell went off! Why not use this for a quick live demo of <a href="http://www.openlinksw.com/virtuoso/whatis.htm">Virtuoso&#39;s hosting capabilities</a>? Starting off with something simple like PHP for instance?</p>
<p>So, I quickly did the following:</p>
<ol>
<li>Cut and pasted the PHP version of this programming puzzle into a text file (using notepad) </li>
<li>Copy and pasted from my Windows Directory to my Virtuoso WebDAV directories on our Windows and Linux Virtuoso Demo Servers. I achieved this by creating Web Folders (Windows OS level</li></ol>]]></content:encoded>
 </rss:item>
 <rss:item xmlns:rss="http://purl.org/rss/1.0/" rdf:about="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2004-03-23#482">
  <rss:title>Demo Hell and back</rss:title>
  <dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2004-03-23T20:04:04Z</dc:date>
  <dc:description xmlns:dc="http://purl.org/dc/elements/1.1/">This piece links to a great Mono presentation (bar the reference placement of MySQL/PostgreSQL in a box somewhat adjacent to ADO.NET (see slide 7). When ADO.NET should have be associated with Data Providers for ODBC, MySQL, PostgresSQL, and others for clarity (the natural goal of the presentation). We have got to take time to understand the Data Access Layer, if we don&#39;t we will utlimately pay a hefty price (IMHO). This blog post is also hillarious, especially if you have encountered the mercurial &quot;Murphy&quot; during live product demos. So, today I went to hell. And then I came back. It was a short trip. This year, I am giving a presentation on Mono at Brainshare in Salt Lake City, an intro to Mono for developers. I got a pretty good turnout with a few ximian people in the back (including Joe whom I saw for the first time without a hat).   So I plug in my PowerBook 12&quot; as I always do but for some reason I have a hard time getting the projector to display its output. After struggling a little I resort to using the desktop provided by Novell, running Ximian Desktop 2 (and some version Suse Linux). So I upload my presentation to www.frenchguys.com from my mac and then download it back to the desktop. Now I can make my presentation, which goes well. Then I get to a slide that just says : DEMO. Hmmm. Demo. I don&#39;t have Mono installed on that generic machine I was just given. I am going to need magic. So to magic I resort. [via Monologue]</dc:description>
  <content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<p>This piece links to a great <a href="http://www.frenchguys.com/temp/Mono.ppt">Mono presentation</a>&nbsp;(bar the reference&nbsp;placement of&nbsp;MySQL/PostgreSQL in a box somewhat adjacent to ADO.NET (see slide 7). When ADO.NET should have be associated with Data Providers for ODBC, MySQL, PostgresSQL, and others for clarity (the natural goal of the presentation).</p>
<p>We have got to take time to understand the Data Access Layer, if we don't we will utlimately <a href="http://www.securityfocus.com/archive/1/358200">pay a hefty price </a>(IMHO).</p>
<p>This blog post is also hillarious, especially if you have encountered the mercurial "Murphy" during live product demos.</p>
<blockquote dir="ltr" style="MARGIN-RIGHT: 0px">
<p>So, today I went to hell. And then I came back. It was a short trip.</p>
<p>This year, I am giving a presentation on Mono at Brainshare in Salt Lake City, an intro to Mono for developers. I got a pretty good turnout with a few ximian people in the back (including Joe whom I saw for the first time without a hat).</p></blockquote>
<p dir="ltr">&nbsp;</p>
<blockquote dir="ltr" style="MARGIN-RIGHT: 0px">
<p>So I plug in my PowerBook 12" as I always do but for some reason I have a hard time getting the projector to display its output. After struggling a little I resort to using the desktop provided by Novell, running Ximian Desktop 2 (and some version Suse Linux).</p>
<p>So I upload my <a href="http://www.frenchguys.com/temp/Mono.ppt" target="_blank">presentation</a> to <a href="http://www.frenchguys.com/" target="blank">www.frenchguys.com</a> from my mac and then download it back to the desktop. Now I can make my presentation, which goes well. Then I get to a slide that just says : <b>DEMO</b>. Hmmm. Demo. I don't have Mono installed on that generic machine I was just given. I am going to need magic. So to magic I resort.</p></blockquote>
<p align="right">[via <a href="http://go-mono.com/monologue">Monologue</a>]</p>]]></content:encoded>
 </rss:item>
 <rss:item xmlns:rss="http://purl.org/rss/1.0/" rdf:about="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2004-01-06#442">
  <rss:title>Enterprise Databases get a grip on XML</rss:title>
  <dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2004-01-06T23:17:07Z</dc:date>
  <dc:description xmlns:dc="http://purl.org/dc/elements/1.1/">Databases get a grip on XMLFrom Inforworld.The next iteration of the SQL standard was supposed to arrive in 2003. But SQL standardization has always been a glacially slow process, so nobody should be surprised that SQL:2003 ? now known as SQL:200n ? isn?t ready yet. Even so, 2003 was a year in which XML-oriented data management, one of the areas addressed by the forthcoming standard, showed up on more and more developers? radar screens.ÃÂ  &gt;&gt; READ MORE This article rounds up product for 2003 in the critical area of Enterprise Database Technology. It&#39;s certainly provides an apt reflection of how Virtuoso compares with offerings from some the larger (but certainly slower to implement) database vendors in this space. As usual Jon Udell&#39;s quote pretty much sums this up: &quot;While the spotlight shone on the heavyweight contenders, a couple of agile innovators made noteworthy advances in 2003. OpenLink Software?s Virtuoso 3.0, which we reviewed in March, stole thunder from all three major players. Like Oracle, it offers a WebDAV-accessible XML repository. Like DB2 Information Integrator, it functions as database middleware that can perform federated ?joins? across SQL and XML sources. And like the forthcoming Yukon, it embeds the .Net CLR (Common Language Runtime), or in the case of Linux, Novell/Ximian?s Mono.&quot; Albeit still somewhat unknown to the broader industry we have remained true our &quot;innovator&quot; discipline, which still remains our chosen path to market leadership. Thus, its worth a quick Virtuoso release history, and featuresÃÂ recap as we get set to up the ante even further in 2004: 1998 - Virtuoso&#39;s initial public beta release with functional emphasis on Virtual Database Engine for ODBC and JDBC Data Sources. 1999 - Virtuoso&#39;s official commercial release, with emphasis stillÃÂ on Virtual Database functionality for ODBC, JDBC accessible SQL Databases. 2000 - Virtuoso 2.0 adds XML Storage, XPath, XML Schema, XQuery, XSL-T, WebDAV, SOAP, UDDI, HTTP, Replication, Free Text Indexing (*feature update*), POP3, and NNTP support. 2002 - Virtuoso 2.7 extends Virtualization prowess beyond data access via enhancements to its Web Services protocol stack implementation by enabling SQL Stored Procedures to be published as Web Services. It also debutsÃÂ its Object-Relational engine enhancements that include theÃÂ incorporation of Java and Microsoft .NET Objects into its User Defined Type, User Defined Functions, and Stored ProcedureÃÂ offerings. 2003 - Virtuoso 3.0 extends data and application logic virtualization into the Application Server realm (basically a Virtual Application server too!), by adding support for ASP.NET, PHP, Java Server Pages runtime hosting (making applications built using any of these languages deployable using Virtuoso across all supported platforms). Collectively each of these releases have contributed to a very premeditated architecture and vision that will ultimately unveil the inherent power of critical I.S infrastructure virtualizationÃÂ along the following lines; data storage, data access , and application logic via coherent integration of SQL, XML, Web Services, and Persistent Stored Modules (.NET, Java, and other object based component building blocks). ÃÂ </dc:description>
  <content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[
<blockquote style="margin-right: 0px;" dir="ltr"> <p><a class="listLinkLrg" title="http://newsletter.infoworld.com/t?ctl=4FEDB6:1F3948D" href="http://newsletter.infoworld.com/t?ctl=4FEDB6:1F3948D" target="_new"><strong><font face="Verdana">Databases get a grip on XML</font></strong></a><br /><font size="2"></font><font face="Verdana">From <a href="http://newsletter.infoworld.com/t?ctl=4FEDB6:1F3948D">Inforworld</a>.</font><br /><br /><font face="Verdana,Geneva,Arial,sans-serif" size="2">The
next iteration of the SQL standard was supposed to arrive in 2003. But
SQL standardization has always been a glacially slow process, so nobody
should be surprised that SQL:2003 ? now known as SQL:200n ? isn?t ready
yet. Even so, 2003 was a year in which XML-oriented data management,
one of the areas addressed by the forthcoming standard, showed up on
more and more developers? radar screens.ÃÂ  <a title="http://newsletter.infoworld.com/t?ctl=4FEDB6:1F3948D" href="http://newsletter.infoworld.com/t?ctl=4FEDB6:1F3948D" target="_blank">&gt;&gt; READ MORE</a></font></p></blockquote> <p dir="ltr"><font face="Verdana" size="2">This
article rounds up product for 2003 in the critical area of Enterprise
Database Technology. It&#39;s certainly provides an apt reflection of how
Virtuoso compares with offerings from some the larger (but certainly
slower to implement) database vendors in this space. As usual Jon
Udell&#39;s quote pretty much sums this up:</font></p> <blockquote style="margin-right: 0px;" dir="ltr"> <p dir="ltr"><!--StartFragment --><span class="artText"><em>&quot;While the spotlight shone on the heavyweight contenders, a couple of agile innovators made noteworthy advances in 2003. </em><a class="regularArticleU" href="http://www.infoworld.com/699"><em>OpenLink Software?s Virtuoso 3.0</em></a><em>,
which we reviewed in March, stole thunder from all three major players.
Like Oracle, it offers a WebDAV-accessible XML repository. Like DB2
Information Integrator, it functions as database middleware that can
perform federated ?joins? across SQL and XML sources. And like the
forthcoming Yukon, it embeds the .Net CLR (Common Language Runtime), or
in the case of Linux, Novell/Ximian?s Mono.&quot;</em></span> </p></blockquote> <p dir="ltr"><font face="Verdana" size="2">Albeit
still somewhat unknown to the broader industry we have remained true
our &quot;innovator&quot; discipline, which still remains our chosen path to
market leadership. Thus, its worth a quick Virtuoso release history,
and featuresÃÂ recap as we get set to up the ante even further in
2004:</font></p> <p dir="ltr"><font face="Verdana" size="2"><a href="http://www.openlinksw.com/press/virtuoso.htm">1998 - Virtuoso&#39;s initial public beta</a> release with functional emphasis on Virtual Database Engine for ODBC and JDBC Data Sources.</font></p> <p dir="ltr"><font face="Verdana" size="2"><a href="http://www.openlinksw.com/press/virtuoso1.htm">1999 - Virtuoso&#39;s official commercial</a> release, with emphasis stillÃÂ on Virtual Database functionality for ODBC, JDBC accessible SQL Databases.</font></p> <p dir="ltr"><font face="Verdana" size="2"><a href="http://www.openlinksw.com/press/v2releas.htm">2000 - Virtuoso 2.0</a>
adds XML Storage, XPath, XML Schema, XQuery, XSL-T, WebDAV, SOAP, UDDI,
HTTP, Replication, Free Text Indexing (*feature update*), POP3, and
NNTP support.</font></p> <p dir="ltr"><font face="Verdana" size="2"><a href="http://www.openlinksw.com/press/v27releas.htm">2002 - Virtuoso 2.7</a>
extends Virtualization prowess beyond data access via enhancements to
its Web Services protocol stack implementation by enabling SQL Stored
Procedures to be published as Web Services. It also debutsÃÂ its
Object-Relational engine enhancements that include
theÃÂ incorporation of Java and Microsoft .NET Objects into its User
Defined Type, User Defined Functions, and Stored
ProcedureÃÂ offerings.</font></p> <p dir="ltr"><font face="Verdana" size="2"><a href="http://www.openlinksw.com/press/virt3beta.htm">2003 - Virtuoso 3.0</a>
extends data and application logic virtualization into the Application
Server realm (basically a Virtual Application server too!), by adding
support for ASP.NET, PHP, Java Server Pages runtime hosting (making
applications built using any of these languages deployable using
Virtuoso across all supported platforms).</font></p> <p dir="ltr"><font face="Verdana" size="2">Collectively
each of these releases have contributed to a very premeditated
architecture and vision that will ultimately unveil the inherent power
of critical I.S infrastructure virtualizationÃÂ along the following
lines; data storage, data access , and application logic via coherent
integration of SQL, XML, Web Services, and Persistent Stored Modules
(.NET, Java, and other object based component building blocks).</font></p> <p dir="ltr"><font face="Verdana"></font>ÃÂ </p>
]]></content:encoded>
 </rss:item>
 <rss:item xmlns:rss="http://purl.org/rss/1.0/" rdf:about="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2003-12-02#433">
  <rss:title>Deploying .NET on Mac OS X Inches closer</rss:title>
  <dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2003-12-03T03:49:43Z</dc:date>
  <dc:description xmlns:dc="http://purl.org/dc/elements/1.1/">02 Dec 2003: Mono 0.29 has been released This release took us a long time to go out, but it is pretty exciting, with PPC supported. The best Mono release ever! [via Monologue] This time last year Mono enabled us to deliver a release of Virtuoso that unveiled the power of .NET integration as a database extension mechanism on Windows and Linux along the following lines; User Defined Types, User Defined Functions, and Stored Procedures using any .NET bound language. It also enabled the deployment of ASP.NET applications on Linux, and on Windows without IIS. One item missing from my check list at the time was a Virtuoso release for Mac OS X with identical functionality. This announcement implies we are within striking distance of a Virtuoso 3.2 release that enables .NET classes and frameworks utilization (along the lines described above) on Mac OS X.</dc:description>
  <content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<BLOCKQUOTE dir=ltr style="MARGIN-RIGHT: 0px">
<P><A href="http://primates.ximian.com/~miguel/all.html#12%2F02%2F2003+12%3A00%3A00">02 Dec 2003: Mono 0.29 has been released</A> </P>
<P>This release took us a long time to go out, but it is pretty exciting, with PPC supported. The best Mono release ever! [via <A href="http://monologue.go-mono.com/">Monologue</A>]</P></BLOCKQUOTE>
<P dir=ltr>This time <A href="http://www.ximian.com/about_us/press_center/press_releases/index.html?pr=openlink_mono">last year </A>Mono enabled us to deliver a release of<A href="http://www.openlinksw.com/virtuoso"> Virtuoso </A>that unveiled the power of .NET integration as a database extension mechanism on Windows and Linux along the following lines; <A href="http://demo.openlinksw.com:8890/tutorial">User Defined Types, User Defined Functions, and Stored Procedures using any .NET bound language</A>. It also enabled the deployment of ASP.NET applications on Linux, and on Windows without IIS. One item missing from my check list at the time was a Virtuoso release for Mac OS X with identical functionality.
<P dir=ltr>This announcement implies we are within striking distance of a Virtuoso 3.2 release that enables .NET classes and frameworks utilization (along the lines described above) on Mac OS X.</P>]]></content:encoded>
 </rss:item>
 <rss:item xmlns:rss="http://purl.org/rss/1.0/" rdf:about="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2003-10-23#395">
  <rss:title>A Virtuoso of a Server</rss:title>
  <dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2003-10-23T21:57:48Z</dc:date>
  <dc:description xmlns:dc="http://purl.org/dc/elements/1.1/">NETWORK WORLD NEWSLETTER: MARK GIBBS ON WEB APPLICATIONS Today&#39;s focus: A Virtuoso of a server By Mark Gibbs One of the bigger drags of Web applications development is that building a system of even modest complexity is a lot like herding cats - you need a database, an applications server, an XML engine, etc., etc. And as they all come from different vendors you are faced with solving the constellation of integration issues that inevitably arise. If you are lucky, your integration results in a smoothly functioning system. If not, you have a lot of spare parts flying in loose formation with the risk of a crash and burn at any moment. An alternative is to look for all of these features and services in a single package but you&#39;ll find few choices in this arena. One that is available and looks very promising is OpenLink&#39;s Virtuoso (see links below). Virtuoso is described as a cross platform (runs on Windows, all Unix flavors, Linux, and Mac OS X) universal server that provides databases, XML services, a Web application server and supporting services all in a single package. OpenLink&#39;s list of supported standards is impressive and includes .Net, Mono, J2EE, XML Web Services (Simple Object Application Protocol, Web Services Description Language, WS-Security, Universal Description, Discovery and Integration), XML, XPath, XQuery, XSL-T, WebDav, HTTP, SMTP, LDAP, POP3, SQL-92, ODBC, JDBC and OLE-DB. Virtuoso provides an HTTP-compliant Web Server; native XML document creation, storage and management; a Web services platform for creation, hosting and consumption of Web services; content replication and synchronization services; free text index server, mail delivery and storage and an NNTP server. Another interesting feature is that with Virtuoso you can create Web services from existing SQL Stored Procedures, Java classes, C++ classes, and &#39;C&#39; functions as well as create dynamic XML documents from ODBC and JDBC data sources. This is an enormous product and implies a serious commitment on the part of adopters due to its scope and range of services. Virtuoso is enormous by virtue of its architectural ambitions, but actual disk requirements are</dc:description>
  <content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<font size="2">
<p><a href="http://www.nwfusion.com/index.html">NETWORK WORLD</a> NEWSLETTER: MARK GIBBS ON WEB APPLICATIONS </p>
<p><font size="2">Today&#39;s focus: A Virtuoso of a server</font></p>
<p>By <a href="http://www.nwfusion.com/columnists/gibbs.html">Mark Gibbs</a></p>
<p>One of the bigger drags of Web applications development is that building a system of even modest complexity is a lot like herding cats - you need a database, an applications server, an XML engine, etc., etc. And as they all come from different vendors you are faced with solving the constellation of integration issues that inevitably arise.</p>
<p>If you are lucky, your integration results in a smoothly functioning system. If not, you have a lot of spare parts flying in loose formation with the risk of a crash and burn at any moment.</p>
<p>An alternative is to look for all of these features and services in a single package but you&#39;ll find few choices in this arena.</p>
<p>One that is available and looks very promising is OpenLink&#39;s Virtuoso (see links below).</p>
<p>Virtuoso is described as a cross platform (runs on Windows, all Unix flavors, Linux, and Mac OS X) universal server that provides databases, XML services, a Web application server and supporting services all in a single package.</p>
<p>OpenLink&#39;s list of supported standards is impressive and includes .Net, Mono, J2EE, XML Web Services (Simple Object Application Protocol, Web Services Description Language, WS-Security, Universal Description, Discovery and Integration), XML, XPath, XQuery, XSL-T, WebDav, HTTP, SMTP, LDAP, POP3, SQL-92, ODBC, JDBC and OLE-DB.</p>
<p>Virtuoso provides an HTTP-compliant Web Server; native XML document creation, storage and management; a Web services platform for creation, hosting and consumption of Web services; content replication and synchronization services; free text index server, mail delivery and storage and an NNTP server.</p>
<p>Another interesting feature is that with Virtuoso you can create Web services from existing SQL Stored Procedures, Java classes,</p>
<p>C++ classes, and &#39;C&#39; functions as well as create dynamic XML</p>
<p>documents from ODBC and JDBC data sources.</p>
<p>This is an enormous product and implies a serious commitment on the part of adopters due to its scope and range of services.</p>
<blockquote dir="ltr" style="MARGIN-RIGHT: 0px">
<p><em>Virtuoso is enormous by virtue of its architectural ambitions, but actual disk requirements are</em></p></blockquote></font>]]></content:encoded>
 </rss:item>
 <rss:item xmlns:rss="http://purl.org/rss/1.0/" rdf:about="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2003-08-05#232">
  <rss:title>Howl is Rendezvous for Windows and Linux</rss:title>
  <dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2003-08-05T19:18:55Z</dc:date>
  <dc:description xmlns:dc="http://purl.org/dc/elements/1.1/">Very interesting, we have basically ported Zeroconfig as released by Apple (in Open Source) too, and used it in both our Virtuoso 3.x and UDA 5.x products. Howl is Rendezvous for Windows and Linux. [via Scripting News] In the case of UDA you can configure ODBC and JDBC consumable data source names that are hosted on the server. Users can nownbspsimply picknbspDSNs from anbspcombo box and they are ready to make connections to remote databases from any ODBC, JDBC, OLE DB, or ADO.NET application.nbspAnother benefit ofnbspZeroconfignbspis that it facilitates centralized server side configuration which further enhances our server side session rules book;nbspwhich serves all our Multi-Tier data access drivers. In the case of Virtuoso you are able to bind to pre-configured Virtuoso instances in exactly the same way. Our Zeroconfig support has beennbspimplemented across Solaris, AIX, Digital UNIX, IRIX, HP-UX amongst others, but this is a project of interest all the same, and we may end up contributing to this effort.</dc:description>
  <content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<p dir="ltr">Very interesting, we have basically ported Zeroconfig as released by Apple (in Open Source) too, and used it in both our <a href="http://www.openlinksw.com/virtuoso/whatis.htm">Virtuoso</a> 3.x and <a href="http://www.openlinksw.com/product.htm">UDA</a> 5.x products.</p>
<blockquote dir="ltr" style="MARGIN-RIGHT: 0px">
<p><a href="http://www.swampwolf.com/products/">Howl</a> is Rendezvous for Windows and Linux. [via <a href="http://www.scripting.com/">Scripting News</a>]</p></blockquote>
<p dir="ltr">In the case of UDA you can configure ODBC and JDBC consumable data source names that are hosted on the server. Users can nownbspsimply picknbspDSNs from anbspcombo box and they are ready to make connections to remote databases from any ODBC, JDBC, OLE DB, or ADO.NET application.nbspAnother benefit ofnbspZeroconfignbspis that it facilitates centralized server side configuration which further enhances our server side session rules book;nbspwhich serves all our Multi-Tier data access drivers.</p>
<p dir="ltr">In the case of Virtuoso you are able to bind to pre-configured Virtuoso instances in exactly the same way.</p>
<p dir="ltr">Our Zeroconfig support has beennbspimplemented across Solaris, AIX, Digital UNIX, IRIX, HP-UX amongst others, but this is a project of interest all the same, and we may end up contributing to this effort.</p>]]></content:encoded>
 </rss:item>
 <rss:item xmlns:rss="http://purl.org/rss/1.0/" rdf:about="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2003-07-07#202">
  <rss:title>eBay Will Someday Buy Oracle?</rss:title>
  <dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2003-07-07T20:51:56Z</dc:date>
  <dc:description xmlns:dc="http://purl.org/dc/elements/1.1/">O&#39;Reilly on the Commoditization of Software Certinaly an interesting proposition, or should I say vision, but I don&#39;t think this proposition does justice to some of the valid insights contained in this recent IDG interview with Tim O&#39;Reilly. Here are some of Tim&#39;s quotes: &quot;Nobody is pointing out something that I think is way more significant: all of the killer apps of the Internet era: Amazon (.com, Inc), Google (Inc.), and Maps.yahoo.com. They run on Linux or FreeBSD, but they&#39;re not apps in the way that people have traditionally thought of applications, so they just don&#39;t get considered. Amazon is built with Perl on top of Linux. It&#39;s basically a bunch of open source hackers, but they&#39;re working for a company that&#39;s as fiercely proprietary as any proprietary software company.&quot; Solutions are always more important that the technology that makes up the solutions from a business development perspective. The trouble is that the constituent parts of a solution ultimately affect the longevity of the solution (the future adaptability of the solution), hence the middleware and components segments of the software industry. &quot;With eBay it&#39;s even clearer. The fact is, it&#39;s the critical mass of marketplace buyers and sellers and all the information that people have put in that marketplace as a repository.&quot;&quot;So I think we&#39;re going to find more and more places where that happens, where somebody gets a critical mass of customers and data and that becomes their source of value. On that basis, I will predict that -- this is an outrageous prediction -- but eBay will buy Oracle someday. The value will have moved so much to people who are not now seen as software suppliers.&quot; In reading this article that I can only assume that Tim does realize the inevitable; computing is, and always will be about data -- creation, transformation, dissemination, and exploitation. That said, you don&#39;t maximize the opportunities that such a realization accords by acquiring the largest vendor of database software. The largest database vendor doesn&#39;t imply dominance in any of the following areas: Data Creation Data Storage Data Access Data Dissemination Data Exploitation I see the Internet as the Database (comprising various forms), and the Web as a dominant database segment within Internet realm. Every Internet Point of Presence is really a point of Data interaction; Creation, Storage, Access, Dissemination, and Exploitation. eBay can acquire a license from Oracle or any other database vendor and still be sucessful, and all they need to do is come to the actual realization that like Amazon and Google they could become a very important Executable and Semantic Web platform by finally understanding that their home page isn&#39;t that important, it&#39;s the interactions with the site that matter. All of this is certainly achievable without acquiring Oracle. In short, this applies to any organization that seeks to incorporate the Internet into their operational strategy (Business Development, Customer Services, Intranets, Extranets etc.). I am inclined to believe that Sofware Commoditization (which has been with us for a very long time) is the new moniker for &quot;its all about data&quot; or to quote Sam Ruby, &quot;It&#39;s just data&quot;.</dc:description>
  <content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<p><a href="http://slashdot.org/article.pl?sid=03/07/04/1955241">O&#39;Reilly on the Commoditization of Software</a> </p>
<p>Certinaly an interesting proposition, or should I say vision, but I don&#39;t think this proposition does justice to some of the valid insights contained in this recent <a href="http://www.idg.se/ArticlePages/idgnet.asp?id=4635">IDG interview </a>with <a href="http://tim.oreilly.com/">Tim O&#39;Reilly</a>. Here are some of Tim&#39;s quotes:</p>
<blockquote dir="ltr" style="MARGIN-RIGHT: 0px">
<p><em>&quot;Nobody is pointing out something that I think is way more significant: all of the killer apps of the Internet era: Amazon (.com, Inc), Google (Inc.), and Maps.yahoo.com. They run on Linux or FreeBSD, but they&#39;re not apps in the way that people have traditionally thought of applications, so they just don&#39;t get considered. Amazon is built with Perl on top of Linux. It&#39;s basically a bunch of open source hackers, but they&#39;re working for a company that&#39;s as fiercely proprietary as any proprietary software company.&quot;</em></p></blockquote>
<p dir="ltr">Solutions are always more important that the technology that makes up the solutions from a business development perspective. The trouble is that the constituent parts of a solution ultimately affect the longevity of the solution (the future adaptability of the solution), hence the middleware and components segments of the software industry.</p>
<blockquote dir="ltr" style="MARGIN-RIGHT: 0px">
<p dir="ltr"><em>&quot;With eBay it&#39;s even clearer. The fact is, it&#39;s the critical mass of marketplace buyers and sellers and all the information that people have put in that marketplace as a repository.&quot;<br /><br />&quot;So I think we&#39;re going to find more and more places where that happens, where somebody gets a critical mass of customers and data and that becomes their source of value. On that basis, I will predict that -- this is an outrageous prediction -- but eBay will buy Oracle someday. The value will have moved so much to people who are not now seen as software suppliers.&quot;</em></p></blockquote>
<p>In reading this article that I can only assume that Tim does realize the inevitable; computing is, and always will be about data -- creation, transformation, dissemination, and exploitation. That said, you don&#39;t maximize the opportunities that such a realization accords by acquiring the largest vendor of database software. </p>
<p>The largest database vendor doesn&#39;t imply dominance in any of the following areas:</p>
<ol>
<li>Data Creation </li>
<li>Data Storage</li>
<li>Data Access</li>
<li>Data Dissemination</li>
<li>Data Exploitation</li></ol>
<p>I see the Internet as the Database (comprising various forms), and the Web as a dominant database segment within Internet realm. Every Internet Point of Presence is really a point of Data interaction; Creation, Storage, Access, Dissemination, and Exploitation.</p>
<p>eBay can acquire a license from Oracle or any other database vendor and still be sucessful, and all they need to do is come to the actual realization that like Amazon and Google they could become a very important Executable and Semantic Web platform by finally understanding that their home page isn&#39;t that important, it&#39;s the interactions with the site that matter. All of this is certainly achievable without acquiring Oracle.</p>
<p>In short, this applies to any organization that seeks to incorporate the Internet into their operational strategy (Business Development, Customer Services, Intranets, Extranets etc.). I am inclined to believe that Sofware Commoditization (which has been with us for a very long time) is the new moniker for &quot;its all about data&quot; or to quote <a href="http://www.intertwingly.net/blog/index.rss">Sam Ruby</a>, &quot;It&#39;s just data&quot;.</p>]]></content:encoded>
 </rss:item>
 <rss:item xmlns:rss="http://purl.org/rss/1.0/" rdf:about="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2003-06-25#187">
  <rss:title>OpenLink Software Announces Virtuoso 3.2 </rss:title>
  <dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2003-06-25T21:35:54Z</dc:date>
  <dc:description xmlns:dc="http://purl.org/dc/elements/1.1/">OpenLink Software Announces Virtuoso 3.2 This Blog Site is actually powered by Virtuoso 3.2 (has been doing so prior to the announcement). Hmm. product utilization preceding press release? Why not? OpenLink adds Weblog client and server functionality to Virtual Database Engine for SQL, XML, and Web Services Burlington, MA. June 25, 2003 - OpenLink Software, Inc., a leading provider of universal data access and enterprise information integration middleware, announces Virtuoso 3.2  the latest edition of its cross platform Virtual Database for SQL, XML, and Web Services  for Mac® OS X. The new release incorporates full client and server support for the Blogger, Moveable Type, and MetaWeblog APIs, providing users with choice over location, format, data storage, development environment, and host operating system, for personal, community, and corporate Weblogs. The new release also facilitates the transparent integration of Weblog data with other enterprise data sources. Full Press Release Putting together the community site took 5 minutes and it basically involved the following steps: 1. Standard installation from installer program (Mac OS X in this case, but Windows, Linux, and UNIX supported) 2. Creation of WebDAV user account for WebDAV repository (where all the gems reside) 3. Clicking on the &quot;Generate Web Site&quot; button situated in the Weblog menu tree with the Virtuoso HTML based Admin UI 4. Filled up my channel and blogrolls by asking Virtuoso to use its very old web content aggregation functionality 5. Setup my upstreams (so that I post once and propagate to my numerous blog sites on a conditional basis) 6. Create a Virtuoso HTTP Virtual Domain for the community/personal Blog 7. Start blogging using any Blog Client that supports; Blogger API, MetaWeblog, or Moveable Type No more no less. Most importantly I have a choice of programming languages (VSP, VSX, PHP, ASP.NET, JSP, Perl, Python), operating systems, and databases that constitute the shape and form of my blog home. See the Virtuoso FAQ for how this all comes together.</dc:description>
  <content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<P><SPAN style="FONT-SIZE: 10pt; FONT-FAMILY: Arial"><A href="http://www.openlinksw.com/press/virt32_wwdc1.htm">OpenLink Software Announces Virtuoso 3.2 </a></span></p>
<P><SPAN style="FONT-SIZE: 10pt; FONT-FAMILY: Arial">This <A href="http://wwdc2003.openlinksw.com/"><SPAN style="FONT-SIZE: 12pt; FONT-FAMILY: 'Times New Roman'"><FONT face=Arial size=2>Blog Site</font></span></a> is actually powered by <A href="http://www.openlinksw.com/virtuoso">Virtuoso</a> 3.2 (has been doing so prior to the announcement). Hmm. product utilization preceding press release? Why not?</span><B><SPAN style="FONT-FAMILY: Arial"><FONT size=3></font></span></b></p>
<BLOCKQUOTE dir=ltr style="MARGIN-RIGHT: 0px">
<P><B><SPAN style="FONT-FAMILY: Arial">OpenLink adds Weblog client and server functionality to <BR>Virtual Database Engine for SQL, XML, and Web Services</span></b><SPAN style="FONT-SIZE: 10pt; FONT-FAMILY: Arial"> <BR><BR><B>Burlington, MA. June 25, 2003</b> - OpenLink Software, Inc., a leading provider of universal data access and enterprise information integration middleware, announces Virtuoso 3.2  the latest edition of its cross platform Virtual Database for SQL, XML, and Web Services  for Mac® OS X. <BR><BR>The new release incorporates full client and server support for the Blogger, Moveable Type, and MetaWeblog APIs, providing users with choice over location, format, data storage, development environment, and host operating system, for personal, community, and corporate Weblogs. The new release also facilitates the transparent integration of Weblog data with other enterprise data sources. </span></p>
<P><SPAN style="FONT-SIZE: 10pt; FONT-FAMILY: Arial"><A href="http://www.openlinksw.com/press/virt32_wwdc1.htm"><SPAN style="FONT-SIZE: 12pt; FONT-FAMILY: 'Times New Roman'"><FONT face=Arial size=2>Full Press Release</font></span></a></span></p></blockquote>
<P dir=ltr><SPAN style="FONT-SIZE: 10pt; FONT-FAMILY: Arial">Putting together the community site took 5 minutes and it basically involved the following steps:</span></p>
<P dir=ltr><SPAN style="FONT-SIZE: 10pt; FONT-FAMILY: Arial">1. Standard installation from installer program (Mac OS X in this case, but Windows, Linux, and UNIX supported)</span></p>
<P dir=ltr><SPAN style="FONT-SIZE: 10pt; FONT-FAMILY: Arial">2. Creation of WebDAV user account for WebDAV repository (where all the gems reside)</span></p>
<P dir=ltr><SPAN style="FONT-SIZE: 10pt; FONT-FAMILY: Arial">3. Clicking on the "Generate Web Site" button situated in the Weblog menu tree with the Virtuoso HTML based Admin UI</span></p>
<P dir=ltr><SPAN style="FONT-SIZE: 10pt; FONT-FAMILY: Arial">4. Filled up my channel and blogrolls by asking Virtuoso to use its <U>very old web</u> content aggregation functionality </span></p>
<P dir=ltr><SPAN style="FONT-SIZE: 10pt; FONT-FAMILY: Arial">5. Setup my upstreams (so that I post once and propagate to my numerous blog sites on a conditional basis)</span></p>
<P dir=ltr><SPAN style="FONT-SIZE: 10pt; FONT-FAMILY: Arial">6. Create a Virtuoso HTTP Virtual Domain for the community/personal Blog </span></p>
<P dir=ltr><SPAN style="FONT-SIZE: 10pt; FONT-FAMILY: Arial">7. Start blogging using any Blog Client that supports; Blogger API, MetaWeblog, or Moveable Type</span></p>
<P dir=ltr><SPAN style="FONT-SIZE: 10pt; FONT-FAMILY: Arial">No more no less. Most importantly I have a choice of programming languages (VSP, VSX, PHP, ASP.NET, JSP, Perl, Python), operating systems, and databases that constitute the shape and form of my blog home. </span></p>
<P dir=ltr><SPAN style="FONT-SIZE: 10pt; FONT-FAMILY: Arial">See the<A href="http://www.openlinksw.com/virtuoso/faqs.htm"> Virtuoso FAQ </a>for how this all comes together.</span></p>]]></content:encoded>
 </rss:item>
 <rss:item xmlns:rss="http://purl.org/rss/1.0/" rdf:about="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2003-06-25#183">
  <rss:title>&lt;p&gt;We all know that the only benchmark that matters, is the one that you run in-house using the systems that comprise your IT infrastructure. &lt;/p&gt;</rss:title>
  <dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2003-06-25T13:27:02Z</dc:date>
  <dc:description xmlns:dc="http://purl.org/dc/elements/1.1/">We all know that the only benchmark that matters, is the one that you run in-house using the systems that comprise your IT infrastructure. Apple&#39;s benchmarks under fire ZDNet Jun 25 2003 7:13AM ET [via Moreover - ZDNet] OpenLink Software has provided an Open Source benchmark utility that support Mac OS X, Linux, and UNIX. Thus, if mission critical database oriented performance is what is most relevant to your needs (as opposed to Photoshop) then simply download either one, or both of the following: OpenLink ODBC Bench (you can test TPC-A and TPC-C like performance of the G5 and compare against other platforms) via ODBC) OpenLink JDBC Bench (same thing using JDBC)</dc:description>
  <content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<P>We all know that the only benchmark that matters, is the one that you run in-house using the systems that comprise your IT infrastructure. </P>
<BLOCKQUOTE dir=ltr style="MARGIN-RIGHT: 0px">
<P><A href="http://c.moreover.com/click/here.pl?r77267478">Apple's benchmarks under fire</A> ZDNet Jun 25 2003 7:13AM ET </P>
<P>[via <A href="http://www.moreover.com/">Moreover - ZDNet</A>]</P></BLOCKQUOTE>
<P>OpenLink Software has provided an Open Source benchmark utility that support Mac OS X, Linux, and UNIX. Thus, if mission critical database oriented performance is what is most relevant to your needs (as opposed to Photoshop) then simply download either one, or both of the following:</P>
<P><A href="http://oplweb2.openlinksw.com:8080/download/util.vsp">OpenLink ODBC Bench</A> (you can test TPC-A and TPC-C like performance of the G5 and compare against other platforms) via ODBC)</P>
<P><A href="http://oplweb2.openlinksw.com:8080/download/util.vsp">OpenLink JDBC Bench </A>(same thing using JDBC)</P>]]></content:encoded>
 </rss:item>
 <rss:item xmlns:rss="http://purl.org/rss/1.0/" rdf:about="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2003-06-18#138">
  <rss:title>Get Ready for Yukon </rss:title>
  <dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2003-06-18T05:19:22Z</dc:date>
  <dc:description xmlns:dc="http://purl.org/dc/elements/1.1/">Get Ready for Yukon The next release of SQL Server promises increased developer productivity and reduced DBA workload. by Roger Jennings June 2003 Issue .NET Magazine After reading this article I decided to put together a simple comparitive analysis of our existing product and the soon to be released Yukon. Our Universal Server product called Virtuoso will compete head on with this future release of SQL Server in many regards (.NET CLR hosting, Native XML Types, SQL-XML, XMLA, Web Services etc.), but I am also keen to see what interesting perspectives Microsoft&#39;s implementation brings to the table. Here is a summary comparison, note that some of the hyperlinks in the table below actually take you to live functionality demos (for effect these links point to a Linux server, and you can change the machine part of the url from &quot;demo&quot; to &quot;kingsleydemo&quot; to see the equivalent demos on an XP server).</dc:description>
  <content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<p><a href="http://www.ftponline.com/dotnetmag/2003_06/magazine/columns/sqlconnection/default.asp">Get Ready for Yukon</a> </p>
<blockquote dir="ltr" style="MARGIN-RIGHT: 0px">
<p>The next release of SQL Server promises increased developer productivity and reduced DBA workload. </p>
<p>by Roger Jennings June 2003 Issue <a href="http://www.ftponline.com/dotnetmag/">.NET Magazine</a> </p></blockquote>
<p>After reading this article I decided to put together a simple comparitive analysis of our existing product and the soon to be released Yukon.</p>
<p>Our <a href="http://www.openlinksw.com/virtuoso/whatis.htm">Universal Server</a> product called <a href="http://www.openlinksw.com/virtuoso">Virtuoso</a> will compete head on with this future release of SQL Server in many regards (.NET CLR hosting, Native XML Types, SQL-XML, XMLA, Web Services etc.), but I am also keen to see what interesting perspectives Microsoft&#39;s implementation brings to the table. Here is a summary comparison, note that some of the hyperlinks in the table below actually take you to live functionality demos (for effect these links point to a Linux server, and you can change the machine part of the url from &quot;demo&quot; to &quot;kingsleydemo&quot; to see the equivalent demos on an XP server).</p>
<table width="97%" border="1">
<tbody>
<tr>
<td width="42%"><font size="2"></font></td></tr></tbody></table>]]></content:encoded>
 </rss:item>
 <rss:item xmlns:rss="http://purl.org/rss/1.0/" rdf:about="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2003-06-10#274">
  <rss:title>RSS Behind the Firewall</rss:title>
  <dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2003-06-11T03:49:21Z</dc:date>
  <dc:description xmlns:dc="http://purl.org/dc/elements/1.1/">RSS Behind the Firewall I knew this day would come, but I&#39;ve been trying to avoid it. For roughly a year now, I&#39;ve been happily reading various news source by using RSS aggregators of various form and function. Some were desktop apps and others were server-side. Some for Windows, some for Linux, and some for OS X. In recent months, there&#39;s been growing talk about RSS at work. And I don&#39;t mean things like the Finance, Ask, or Buzz RSS stuff. There&#39;s been talk of using it internally. We have a growing number of internal weblogs (or people looking to experiment with them) and some in-house tools that now generate RSS. This is great. But it&#39;s going to suck too. The honeymoon is over. Now I need to have two aggregators: one at home and one at work. I&#39;m used to doing this for e-mail, but that doesn&#39;t mean I like it. I suppose I could start taking my laptop to work every day, but then I&#39;d have to take my laptop to work everyday. I&#39;ve been thinking about this for a while and haven&#39;t come up with any good solution. I suppose that someone could work on synchronizing aggregators. Then I could sync up my home and work aggregators somehow. Maybe that&#39;ll happen? I wonder if is going to become a more common problem as RSS picks up steam in various companies.[via Jeremy Zawodny&#39;s blog]</dc:description>
  <content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<A href="http://jeremy.zawodny.com/blog/archives/000782.html">RSS Behind the Firewall</A> 
<P>I knew this day would come, but I've been trying to avoid it. For roughly a year now, I've been happily reading various news source by using RSS aggregators of various form and function. Some were desktop apps and others were server-side. Some for Windows, some for Linux, and some for OS X.</P>
<P>In recent months, there's been growing <A href="http://jeremy.zawodny.com/blog/archives/000421.html">talk</A> about RSS at work. And I don't mean things like the <A href="http://jeremy.zawodny.com/mt/mt-search.cgi?search=finance+rss&amp;IncludeBlogs=1">Finance</A>, <A href="http://ask.yahoo.com/ask/index.xml">Ask</A>, or <A href="http://jeremy.zawodny.com/blog/archives/000774.html">Buzz RSS</A> stuff. There's been talk of using it <EM>internally</EM>. We have a growing number of internal weblogs (or people looking to experiment with them) and some in-house tools that now generate RSS.</P>
<P>This is great.</P>
<P>But it's going to suck too.</P>
<P>The honeymoon is over. Now I need to have <EM>two</EM> aggregators: one at home and one at work.</P>
<P>I'm used to doing this for e-mail, but that doesn't mean I like it. I suppose I could start taking my laptop to work every day, but then I'd have to take my laptop to work everyday.</P>
<P>I've been thinking about this for a while and haven't come up with any good solution. I suppose that someone could work on synchronizing aggregators. Then I could sync up my home and work aggregators somehow. Maybe that'll happen?</P>
<P>I wonder if is going to become a more common problem as RSS picks up steam in various companies.[via <A href="http://jeremy.zawodny.com/blog/">Jeremy Zawodny's blog</A>]</P>
<DIV></DIV>]]></content:encoded>
 </rss:item>
 <rss:item xmlns:rss="http://purl.org/rss/1.0/" rdf:about="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2003-06-08#108">
  <rss:title>&lt;p&gt;When Mono is completed, Linux is the option for the desktop.&lt;/p&gt;</rss:title>
  <dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2003-06-08T18:51:20Z</dc:date>
  <dc:description xmlns:dc="http://purl.org/dc/elements/1.1/">When Mono is completed, Linux is the option for the desktop. [From Frans Bouma&#39;s blog in Boldface, My comments in italics] Randy Holloway wrote about his vision on Linux and then especially about Linux on the desktop. I disagree with his vision, I think Linux is definitely an option for the desktop at the moment and thus also in the foreseably future. It will become the option for the desktop when Mono is completed. The reason for this is simple: a lot of Windows programs will be written using .NET. If you can run these programs on Linux too, using Mono, what&#39;s keeping you on Windows? Perhaps the games. But definitely not the business applications, since the Linux version for spreadsheets, browsers, wordprocessors, emailprograms and other every-day software are solid today, even when compared to Microsoft Office XP. Linux desktop office applications do not rival those of Windows, in particular Office 2003. We have to be careful when we make generic statements such as this becuase the end result is disappointment and frustation for corporate Linux neophyte. Imagine a corporate power user that has used Excel to produce Pivot tables (like I do) that provide me with a critical success factors dashboard for my enterprise. If I was to move to any of the incarnations of open office this would be lost. Now, for the corporate user -knowledge, information worker- that I believe Randy has in mind this remains a problem re. Linux as a desktop offering today. On the other hand, how true is the position that I presented above? By this I mean, how many knowledge workers actually make use of Pivot Tables in Excel? Something tells me I am the exception rather than the norm. Thus, moving away from Desktop productivity tools of type &quot;Office 200x&quot;, and looking at email, and web browsing etc. Linux certainly matches Windows pound for pound, but is this enough? What is the current &quot;activation threshold&quot; for Windows vs. Linux for a Desktop user (who just wants email and web browsing)? I think this is Linux distribution dependent, now the last time I attempted this experiment (at least over a year ago) Windows won flat out becuase I had to wrestle with X Configuration en route to getting a graphical desktop (I believe this has improved vastly of late, but I need to perform this experiment using current 8.x and higher Linux distros.). I&#39;ve hated Linux and especially its most hardcore supporters, for years. However, you can&#39;t have an unbiased vision on what is best for a given company to use as the OS of choice if you are biased yourself. Mono changed me, I really think Mono is the best Linux has ever experienced: it makes transitions of software written for the Windows platform to a free (as in beer, I don&#39;t believe in the GPL-philosophy) OS possible. Mono is going to be the most significant Linux &lt;--&gt; Windows harmonization effort over the long term. This is because parity will no longer be about getting the likes of Open Office to reach functional parity with &quot;Office 200x&quot; as future Windows applications will be &quot;managed code&quot; in nature (a strategic Microsoft goal over the long term), and Mono&#39;s goal is to run &quot;managed code&quot; outside the Windows platform (this applies to Linux, UNIX, and other platforms). Besides Mono, I do think Linux is a good platform to use for everyday business applications today, because the office tools can use Exchange, they can read/write MS Office documents, so why bother investing in MS software when you can save that money and choose the alternative? The only problem is: when you have a lot of desktops to admin as a sysadmin, and you want to do that with the easy tools in Windows server 2003, you&#39;re out of luck.  Linux is a good platform for everday business applications, but not quite good enough in the area of unravelling it&#39;s value proposition to the point of obvious simplification for corporate decision makers. This is the current hump in the road to this critical destination in my humble opinion. Randy and Frans are making very good points that shed light on some of the less covered aspects of the Linux vs. Windows debate.</dc:description>
  <content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<P>When Mono is completed, Linux is the option for the desktop.</P>
<P>[From <A href="http://weblogs.asp.net/fbouma/">Frans Bouma's blog</A>&nbsp;in Boldface, <EM>My comments in italics</EM>]</P>
<P>Randy Holloway <A href="http://weblogs.asp.net/rholloway/posts/8369.aspx">wrote</A> about his <A href="http://weblogs.asp.net/rholloway/posts/8370.aspx">vision on Linux</A> and then especially about Linux on the desktop. I disagree with his vision, I think Linux is definitely an option for the desktop at the moment and thus also in the foreseably future. It will become <EM>the</EM> option for the desktop when Mono is completed. The reason for this is simple: a lot of Windows programs will be written using .NET. If you can run these programs on Linux too, using Mono, what's keeping you on Windows? Perhaps the games. But definitely not the business applications, since the Linux version for spreadsheets, browsers, wordprocessors, emailprograms and other every-day software are solid <EM>today</EM>, even when compared to Microsoft Office XP. </P>
<P><EM>Linux desktop office applications do not rival those of Windows, in particular Office 2003. We have to be careful when we make generic statements such as this becuase the end result is disappointment and frustation for corporate Linux neophyte.</EM></P>
<P><EM>Imagine a corporate power user that has used Excel to produce Pivot tables (like I do) that provide me with a critical success factors dashboard for my enterprise. If I was to move to any of the incarnations of open office this would be lost. Now, for the corporate user -knowledge, information worker- that I believe Randy has in mind this remains a problem re. Linux as a desktop offering today.</EM></P>
<P><EM>On the other hand, how true is the position that I presented above? By this I mean, how many knowledge workers actually make use of Pivot Tables in Excel? Something tells me I am the exception rather than the norm. Thus, moving away from Desktop productivity tools of type "Office 200x", and looking at email, and web browsing etc. Linux certainly matches Windows pound for pound, but is this enough? What is the current "activation threshold" for Windows vs. Linux for a Desktop user (who just wants email and web browsing)? I think this is Linux distribution dependent, now the last time I attempted this experiment (at least over a year ago) Windows won flat out becuase I had to wrestle with X Configuration en route to getting a graphical desktop (I believe this has improved vastly of late, but I need to perform this experiment using current 8.x and higher Linux distros.).</EM></P>
<P>I've hated Linux and especially its most hardcore supporters, for years. However, you can't have an unbiased vision on what is best for a given company to use as the OS of choice if you are biased yourself. Mono changed me, I really think Mono is the best Linux has ever experienced: it makes transitions of software written for the Windows platform to a free (as in beer, I don't believe in the GPL-philosophy) OS possible.</P>
<P><EM>Mono is going to be the most significant Linux &lt;--&gt; Windows harmonization effort over the long term. This is because parity will no longer be about getting the likes of Open Office to reach functional parity with "Office 200x" as future Windows applications will be "managed code" in nature (a strategic Microsoft goal over the long term), and Mono's goal is to run "managed code" outside the Windows platform (this applies to Linux, UNIX, and other platforms).</EM></P>
<P>Besides Mono, I do think Linux is a good platform to use for everyday business applications today, because the office tools can use Exchange, they can read/write MS Office documents, so why bother investing in MS software when you can save that money and choose the alternative? The only problem is: when you have a lot of desktops to admin as a sysadmin, and you want to do that with the easy tools in Windows server 2003, you're out of luck.&nbsp;</P>
<P><EM>Linux is a good platform for everday business applications, but not quite good&nbsp;enough in the area of unravelling it's value proposition to the point of obvious simplification for&nbsp;corporate decision makers. This is the current hump in the road to this critical destination in my humble opinion.</EM></P>
<P><EM>Randy and Frans are making very good points that shed light on some of the less covered aspects of the Linux vs. Windows debate.</EM></P>]]></content:encoded>
 </rss:item>
 <rss:item xmlns:rss="http://purl.org/rss/1.0/" rdf:about="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2003-06-08#261">
  <rss:title>&lt;p&gt;When Mono is completed, Linux is the option for the desktop.&lt;/p&gt;</rss:title>
  <dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2003-06-08T18:51:20Z</dc:date>
  <dc:description xmlns:dc="http://purl.org/dc/elements/1.1/">When Mono is completed, Linux is the option for the desktop. [From Frans Bouma&#39;s blog in Boldface, My comments in italics] Randy Holloway wrote about his vision on Linux and then especially about Linux on the desktop. I disagree with his vision, I think Linux is definitely an option for the desktop at the moment and thus also in the foreseably future. It will become the option for the desktop when Mono is completed. The reason for this is simple: a lot of Windows programs will be written using .NET. If you can run these programs on Linux too, using Mono, what&#39;s keeping you on Windows? Perhaps the games. But definitely not the business applications, since the Linux version for spreadsheets, browsers, wordprocessors, emailprograms and other every-day software are solid today, even when compared to Microsoft Office XP. Linux desktop office applications do not rival those of Windows, in particular Office 2003. We have to be careful when we make generic statements such as this becuase the end result is disappointment and frustation for corporate Linux neophyte. Imagine a corporate power user that has used Excel to produce Pivot tables (like I do) that provide me with a critical success factors dashboard for my enterprise. If I was to move to any of the incarnations of open office this would be lost. Now, for the corporate user -knowledge, information worker- that I believe Randy has in mind this remains a problem re. Linux as a desktop offering today. On the other hand, how true is the position that I presented above? By this I mean, how many knowledge workers actually make use of Pivot Tables in Excel? Something tells me I am the exception rather than the norm. Thus, moving away from Desktop productivity tools of type &quot;Office 200x&quot;, and looking at email, and web browsing etc. Linux certainly matches Windows pound for pound, but is this enough? What is the current &quot;activation threshold&quot; for Windows vs. Linux for a Desktop user (who just wants email and web browsing)? I think this is Linux distribution dependent, now the last time I attempted this experiment (at least over a year ago) Windows won flat out becuase I had to wrestle with X Configuration en route to getting a graphical desktop (I believe this has improved vastly of late, but I need to perform this experiment using current 8.x and higher Linux distros.). I&#39;ve hated Linux and especially its most hardcore supporters, for years. However, you can&#39;t have an unbiased vision on what is best for a given company to use as the OS of choice if you are biased yourself. Mono changed me, I really think Mono is the best Linux has ever experienced: it makes transitions of software written for the Windows platform to a free (as in beer, I don&#39;t believe in the GPL-philosophy) OS possible. Mono is going to be the most significant Linux &lt;--&gt; Windows harmonization effort over the long term. This is because parity will no longer be about getting the likes of Open Office to reach functional parity with &quot;Office 200x&quot; as future Windows applications will be &quot;managed code&quot; in nature (a strategic Microsoft goal over the long term), and Mono&#39;s goal is to run &quot;managed code&quot; outside the Windows platform (this applies to Linux, UNIX, and other platforms). Besides Mono, I do think Linux is a good platform to use for everyday business applications today, because the office tools can use Exchange, they can read/write MS Office documents, so why bother investing in MS software when you can save that money and choose the alternative? The only problem is: when you have a lot of desktops to admin as a sysadmin, and you want to do that with the easy tools in Windows server 2003, you&#39;re out of luck.  Linux is a good platform for everday business applications, but not quite good enough in the area of unravelling it&#39;s value proposition to the point of obvious simplification for corporate decision makers. This is the current hump in the road to this critical destination in my humble opinion. Randy and Frans are making very good points that shed light on some of the less covered aspects of the Linux vs. Windows debate.</dc:description>
  <content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<P>When Mono is completed, Linux is the option for the desktop.</P>
<P>[From <A href="http://weblogs.asp.net/fbouma/">Frans Bouma's blog</A>&nbsp;in Boldface, <EM>My comments in italics</EM>]</P>
<P>Randy Holloway <A href="http://weblogs.asp.net/rholloway/posts/8369.aspx">wrote</A> about his <A href="http://weblogs.asp.net/rholloway/posts/8370.aspx">vision on Linux</A> and then especially about Linux on the desktop. I disagree with his vision, I think Linux is definitely an option for the desktop at the moment and thus also in the foreseably future. It will become <EM>the</EM> option for the desktop when Mono is completed. The reason for this is simple: a lot of Windows programs will be written using .NET. If you can run these programs on Linux too, using Mono, what's keeping you on Windows? Perhaps the games. But definitely not the business applications, since the Linux version for spreadsheets, browsers, wordprocessors, emailprograms and other every-day software are solid <EM>today</EM>, even when compared to Microsoft Office XP. </P>
<P><EM>Linux desktop office applications do not rival those of Windows, in particular Office 2003. We have to be careful when we make generic statements such as this becuase the end result is disappointment and frustation for corporate Linux neophyte.</EM></P>
<P><EM>Imagine a corporate power user that has used Excel to produce Pivot tables (like I do) that provide me with a critical success factors dashboard for my enterprise. If I was to move to any of the incarnations of open office this would be lost. Now, for the corporate user -knowledge, information worker- that I believe Randy has in mind this remains a problem re. Linux as a desktop offering today.</EM></P>
<P><EM>On the other hand, how true is the position that I presented above? By this I mean, how many knowledge workers actually make use of Pivot Tables in Excel? Something tells me I am the exception rather than the norm. Thus, moving away from Desktop productivity tools of type "Office 200x", and looking at email, and web browsing etc. Linux certainly matches Windows pound for pound, but is this enough? What is the current "activation threshold" for Windows vs. Linux for a Desktop user (who just wants email and web browsing)? I think this is Linux distribution dependent, now the last time I attempted this experiment (at least over a year ago) Windows won flat out becuase I had to wrestle with X Configuration en route to getting a graphical desktop (I believe this has improved vastly of late, but I need to perform this experiment using current 8.x and higher Linux distros.).</EM></P>
<P>I've hated Linux and especially its most hardcore supporters, for years. However, you can't have an unbiased vision on what is best for a given company to use as the OS of choice if you are biased yourself. Mono changed me, I really think Mono is the best Linux has ever experienced: it makes transitions of software written for the Windows platform to a free (as in beer, I don't believe in the GPL-philosophy) OS possible.</P>
<P><EM>Mono is going to be the most significant Linux &lt;--&gt; Windows harmonization effort over the long term. This is because parity will no longer be about getting the likes of Open Office to reach functional parity with "Office 200x" as future Windows applications will be "managed code" in nature (a strategic Microsoft goal over the long term), and Mono's goal is to run "managed code" outside the Windows platform (this applies to Linux, UNIX, and other platforms).</EM></P>
<P>Besides Mono, I do think Linux is a good platform to use for everyday business applications today, because the office tools can use Exchange, they can read/write MS Office documents, so why bother investing in MS software when you can save that money and choose the alternative? The only problem is: when you have a lot of desktops to admin as a sysadmin, and you want to do that with the easy tools in Windows server 2003, you're out of luck.&nbsp;</P>
<P><EM>Linux is a good platform for everday business applications, but not quite good&nbsp;enough in the area of unravelling it's value proposition to the point of obvious simplification for&nbsp;corporate decision makers. This is the current hump in the road to this critical destination in my humble opinion.</EM></P>
<P><EM>Randy and Frans are making very good points that shed light on some of the less covered aspects of the Linux vs. Windows debate.</EM></P>]]></content:encoded>
 </rss:item>
 <rss:item xmlns:rss="http://purl.org/rss/1.0/" rdf:about="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2003-06-08#258">
  <rss:title>Merrill Lynch: Linux saves money</rss:title>
  <dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2003-06-08T17:05:58Z</dc:date>
  <dc:description xmlns:dc="http://purl.org/dc/elements/1.1/">Merrill Lynch: Linux saves money An executive at the investment banker says research shows that deploying Linux internally that could save the company millions of dollars. [via CNET News.com] &lt;exception/&gt;</dc:description>
  <content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<A href="http://rss.com.com/2100-1016_3-1014287.html?type=pt&amp;part=rss&amp;tag=feed&amp;subj=news">Merrill Lynch: Linux saves money</A> An executive at the investment banker says research shows that deploying Linux internally that could save the company millions of dollars. [via <A href="http://www.news.com/">CNET News.com</A>]
<DIV>&lt;exception/&gt;</DIV>]]></content:encoded>
 </rss:item>
 <rss:item xmlns:rss="http://purl.org/rss/1.0/" rdf:about="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2003-06-06#257">
  <rss:title>Intel Benchmark Test: Linux Goes to 600,000</rss:title>
  <dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2003-06-07T02:26:03Z</dc:date>
  <dc:description xmlns:dc="http://purl.org/dc/elements/1.1/">Intel Benchmark Test: Linux Goes to 600,000 &quot;...Using the TPC-C benchmark test, Intel measured the computing performance of a 32-processor Itanium server running Linux, getting a score of almost 600,000 transactions per minute. &quot;Seems Linux is moving up to where the big boys play. (jobert) [via Lockergnome&#39;s Bits and Bytes]</dc:description>
  <content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<A href="http://www.lockergnome.com/update/archives/week_2003_06_01.html#005803">Intel Benchmark Test: Linux Goes to 600,000</A> "...Using the TPC-C benchmark test, Intel measured the computing performance of a 32-processor Itanium server running Linux, getting a score of almost 600,000 transactions per minute. "<BR><BR>Seems Linux is moving up to where the big boys play. (jobert) [via <A href="http://update.lockergnome.com/">Lockergnome's Bits and Bytes</A>]
<DIV></DIV>]]></content:encoded>
 </rss:item>
 <rss:item xmlns:rss="http://purl.org/rss/1.0/" rdf:about="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2003-06-06#103">
  <rss:title>Intel Benchmark Test: Linux Goes to 600,000</rss:title>
  <dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2003-06-07T02:25:32Z</dc:date>
  <dc:description xmlns:dc="http://purl.org/dc/elements/1.1/">Intel Benchmark Test: Linux Goes to 600,000 &quot;...Using the TPC-C benchmark test, Intel measured the computing performance of a 32-processor Itanium server running Linux, getting a score of almost 600,000 transactions per minute. &quot;Seems Linux is moving up to where the big boys play. (jobert) [via Lockergnome&#39;s Bits and Bytes]</dc:description>
  <content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<a href="http://www.lockergnome.com/update/archives/week_2003_06_01.html#005803">Intel Benchmark Test: Linux Goes to 600,000</a> &quot;...Using the TPC-C benchmark test, Intel measured the computing performance of a 32-processor Itanium server running Linux, getting a score of almost 600,000 transactions per minute. &quot;<br /><br />Seems Linux is moving up to where the big boys play. (jobert) [via <a href="http://update.lockergnome.com/">Lockergnome&#39;s Bits and Bytes</a>]
<div></div>]]></content:encoded>
 </rss:item>
 <rss:item xmlns:rss="http://purl.org/rss/1.0/" rdf:about="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2003-06-06#256">
  <rss:title>Intel Benchmark Test: Linux Goes to 600,000</rss:title>
  <dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2003-06-07T02:25:32Z</dc:date>
  <dc:description xmlns:dc="http://purl.org/dc/elements/1.1/">Intel Benchmark Test: Linux Goes to 600,000 &quot;...Using the TPC-C benchmark test, Intel measured the computing performance of a 32-processor Itanium server running Linux, getting a score of almost 600,000 transactions per minute. &quot;Seems Linux is moving up to where the big boys play. (jobert) [via Lockergnome&#39;s Bits and Bytes]</dc:description>
  <content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<A href="http://www.lockergnome.com/update/archives/week_2003_06_01.html#005803">Intel Benchmark Test: Linux Goes to 600,000</A> "...Using the TPC-C benchmark test, Intel measured the computing performance of a 32-processor Itanium server running Linux, getting a score of almost 600,000 transactions per minute. "<BR><BR>Seems Linux is moving up to where the big boys play. (jobert) [via <A href="http://update.lockergnome.com/">Lockergnome's Bits and Bytes</A>]
<DIV></DIV>]]></content:encoded>
 </rss:item>
 <rss:item xmlns:rss="http://purl.org/rss/1.0/" rdf:about="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2003-06-06#255">
  <rss:title>UK councils dump Windows for Linux</rss:title>
  <dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2003-06-06T13:58:46Z</dc:date>
  <dc:description xmlns:dc="http://purl.org/dc/elements/1.1/">UK councils dump Windows for Linux ZDNet Jun 6 2003 9:09AM ET [via Moreover - ZDNet] The move has particular significance since the council last year completed a successful e-government &#39;pathfinder&#39; project involving a group of neighbouring councils: Barking and Dagenham, Hackney, Havering, Redbridge, Thanet, Tower Hamlets and Waltham Forest. &quot;If this is seen to work in Newham, it has the potential to be a significant project, changing the perceptions of other councils,&quot; said Tim Dawes, director of local government technology consultants Nineveh. Nottingham is set to decide on new software for its 6,500 desktop PCs by the end of 2003 and confirmed to E-Government Bulletin this week that open source solutions are being considered. The news follows the council&#39;s successful migration to a Linux-based email system last year, after suffering numerous problems with its proprietary system. According to technology manager Richard Heggs, shifting to open source messaging has cut costs by at least a third, a saving that would be repeated for desktops. Looks like the municipalities figured out the cost-benefits of Linux vs. Windows much quicker than the corporates.</dc:description>
  <content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<A href="http://c.moreover.com/click/here.pl?r74774733">UK councils dump Windows for Linux</A> ZDNet Jun 6 2003 9:09AM ET 
<DIV align=right>[via <A href="http://www.moreover.com/">Moreover - ZDNet</A>]</DIV>
<P class=a2 align=left>The move has particular significance since the council last year completed a successful e-government 'pathfinder' project involving a group of neighbouring councils: Barking and Dagenham, Hackney, Havering, Redbridge, Thanet, Tower Hamlets and Waltham Forest. </P>
<P class=a2 align=left>"If this is seen to work in Newham, it has the potential to be a significant project, changing the perceptions of other councils," said Tim Dawes, director of local government technology consultants Nineveh. </P>
<P class=a2 align=left>Nottingham is set to decide on new software for its 6,500 desktop PCs by the end of 2003 and confirmed to E-Government Bulletin this week that open source solutions are being considered. The news follows the council's successful migration to a Linux-based email system last year, after suffering numerous problems with its proprietary system. </P>
<P class=a2 align=left>According to technology manager Richard Heggs, shifting to open source messaging has cut costs by at least a third, a saving that would be repeated for desktops. </P>
<P class=a2 align=left><EM>Looks like the municipalities figured out the cost-benefits of Linux vs. Windows much quicker than the corporates.</EM></P>]]></content:encoded>
 </rss:item>
 <rss:item xmlns:rss="http://purl.org/rss/1.0/" rdf:about="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2003-06-05#100">
  <rss:title>Linux vs SCO: An opinion from the BSD point of view.</rss:title>
  <dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2003-06-06T02:47:06Z</dc:date>
  <dc:description xmlns:dc="http://purl.org/dc/elements/1.1/">Linux vs SCO: An opinion from the BSD point of view. &lt;P&gt; Greg Lehey has written an excellent article for Daemon News on the Linux versus SCO debacle from the point of view of a BSD user. (Or at least from the point of view of one BSD user). &lt;P&gt; One particularly interesting idea: &lt;P&gt; &lt;blockquote&gt; &lt;quote&gt; Linux source code is freely available. UnixWare source code is not, even less than many other proprietary UNIX implementations. Thus it would be easier to copy code from Linux to UnixWare then from UnixWare to Linux. &lt;/quote&gt; &lt;/blockquote&gt; &lt;P&gt; Lehey also has a page tracking the debate. [via Meerkat: An Open Wire Service: O&#39;Reilly Network Weblogs]</dc:description>
  <content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<A href="http://www.oreillynet.com/pub/wlg/3268">Linux vs SCO: An opinion from the BSD point of view.</A> &lt;P&gt; Greg Lehey has written an excellent article for Daemon News on the Linux versus SCO debacle from the point of view of a BSD user. (Or at least from the point of view of one BSD user). &lt;P&gt; One particularly interesting idea: &lt;P&gt; &lt;blockquote&gt; &lt;quote&gt; Linux source code is freely available. UnixWare source code is not, even less than many other proprietary UNIX implementations. Thus it would be easier to copy code from Linux to UnixWare then from UnixWare to Linux. &lt;/quote&gt; &lt;/blockquote&gt; &lt;P&gt; Lehey also has a page tracking the debate. [via <A href="http://meerkat.oreillynet.com/">Meerkat: An Open Wire Service: O'Reilly Network Weblogs</A>]
<DIV></DIV>]]></content:encoded>
 </rss:item>
 <rss:item xmlns:rss="http://purl.org/rss/1.0/" rdf:about="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2003-06-05#253">
  <rss:title>Linux vs SCO: An opinion from the BSD point of view.</rss:title>
  <dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2003-06-06T02:47:06Z</dc:date>
  <dc:description xmlns:dc="http://purl.org/dc/elements/1.1/">Linux vs SCO: An opinion from the BSD point of view. &lt;P&gt; Greg Lehey has written an excellent article for Daemon News on the Linux versus SCO debacle from the point of view of a BSD user. (Or at least from the point of view of one BSD user). &lt;P&gt; One particularly interesting idea: &lt;P&gt; &lt;blockquote&gt; &lt;quote&gt; Linux source code is freely available. UnixWare source code is not, even less than many other proprietary UNIX implementations. Thus it would be easier to copy code from Linux to UnixWare then from UnixWare to Linux. &lt;/quote&gt; &lt;/blockquote&gt; &lt;P&gt; Lehey also has a page tracking the debate. [via Meerkat: An Open Wire Service: O&#39;Reilly Network Weblogs]</dc:description>
  <content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<A href="http://www.oreillynet.com/pub/wlg/3268">Linux vs SCO: An opinion from the BSD point of view.</A> &lt;P&gt; Greg Lehey has written an excellent article for Daemon News on the Linux versus SCO debacle from the point of view of a BSD user. (Or at least from the point of view of one BSD user). &lt;P&gt; One particularly interesting idea: &lt;P&gt; &lt;blockquote&gt; &lt;quote&gt; Linux source code is freely available. UnixWare source code is not, even less than many other proprietary UNIX implementations. Thus it would be easier to copy code from Linux to UnixWare then from UnixWare to Linux. &lt;/quote&gt; &lt;/blockquote&gt; &lt;P&gt; Lehey also has a page tracking the debate. [via <A href="http://meerkat.oreillynet.com/">Meerkat: An Open Wire Service: O'Reilly Network Weblogs</A>]
<DIV></DIV>]]></content:encoded>
 </rss:item>
 <rss:item xmlns:rss="http://purl.org/rss/1.0/" rdf:about="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2003-06-04#363">
  <rss:title>Ballmer memo targets Linux</rss:title>
  <dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2003-06-05T00:08:22Z</dc:date>
  <dc:description xmlns:dc="http://purl.org/dc/elements/1.1/">Ballmer memo targets Linux ZDNet Jun 4 2003 2:32PM ET [via Moreover - ZDNet] Key Quote from Ballmer: &quot;Information is the lifeblood of business,&quot; Ballmer countered, &quot;and software is what gives people and businesses the ability to harness it. Software is what enables us to collect, manipulate, access, store, share, analyze and act on information. It enables companies to constantly hone their competitive edge. So, contrary to the idea that we&#39;re entering a &#39;post-technological era,&#39; I believe that taking software to the next level will be one of the biggest sources of value creation for customers, and that Microsoft is well-positioned to enable this and to benefit from it.&quot;</dc:description>
  <content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<A href="http://c.moreover.com/click/here.pl?r74497334">Ballmer memo targets Linux</A> ZDNet Jun 4 2003 2:32PM ET [via <A href="http://www.moreover.com/">Moreover - ZDNet</A>] 
<DIV></DIV>
<P><EM>Key Quote&nbsp;from Ballmer:</EM></P>
<P>"Information is the lifeblood of business," Ballmer countered, "and software is what gives people and businesses the ability to harness it. Software is what enables us to collect, manipulate, access, store, share, analyze and act on information. It enables companies to constantly hone their competitive edge. So, contrary to the idea that we're entering a 'post-technological era,' I believe that taking software to the next level will be one of the biggest sources of value creation for customers, and that Microsoft is well-positioned to enable this and to benefit from it." </P>]]></content:encoded>
 </rss:item>
 <rss:item xmlns:rss="http://purl.org/rss/1.0/" rdf:about="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2003-05-30#346">
  <rss:title>Microsoft Linux? Or Microsoft Unix?</rss:title>
  <dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2003-05-30T21:25:37Z</dc:date>
  <dc:description xmlns:dc="http://purl.org/dc/elements/1.1/">Microsoft Linux? Or Microsoft Unix? Ryan writes &quot;Microsoft working on a version of Linux? Mike Elgan writes that the Redmond company is losing its grip on the government market, and when the corporate market falls it will be motivated to release its own Linux distribution. Microsoft Linux may soon be more than just a hoax!&quot; Of course, the argument isn&#39;t based on any actual knowledge, but just a reasoned guess. This rumor/prediction seems to pop up every few months, and I usually just ignore it. However, now, the latest I, Cringely column has a much more well reasoned analysis of why he thinks Microsoft is going to launch their own Unix. He thinks that&#39;s the real reason behind their recent licensing of Unix IP from SCO. They realized that if they&#39;re going to launch their own Unix-style operating system, why not make it actually Unix, instead of Linux? As I said, these rumors (and hoaxes) have been around for ages, so I wouldn&#39;t put too much weight into them at this point. [via Techdirt]</dc:description>
  <content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<a href="http://techdirt.com/articles/20030530/1425224.shtml">Microsoft Linux? Or Microsoft Unix?</a> <b>Ryan</b> writes <i>&quot;Microsoft working on a version of Linux? Mike Elgan writes that the Redmond company is losing its grip on the government market, and when the corporate market falls it will be motivated to release its own Linux distribution. <a href="http://www.mikeslist.com/65.htm">Microsoft Linux</a> may soon be more than just a <a href="http://www.mslinux.org/">hoax</a>!&quot;</i> Of course, the argument isn&#39;t based on any actual knowledge, but just a reasoned guess. This rumor/prediction seems to pop up every few months, and I usually just ignore it. However, now, the latest I, Cringely column has a much more well reasoned analysis of why he thinks <a href="http://www.pbs.org/cringely/pulpit/pulpit20030529.html">Microsoft is going to launch their own Unix</a>. He thinks that&#39;s the real reason behind their recent licensing of Unix IP from SCO. They realized that if they&#39;re going to launch their own Unix-style operating system, why not make it actually Unix, instead of Linux? As I said, these rumors (and hoaxes) have been around for ages, so I wouldn&#39;t put too much weight into them at this point. [via <a href="http://www.techdirt.com/">Techdirt</a>]
<div></div>]]></content:encoded>
 </rss:item>
 <rss:item xmlns:rss="http://purl.org/rss/1.0/" rdf:about="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2003-05-22#52">
  <rss:title>&lt;a href=&quot;http://www.go-mono.com/index.html#May20th,2003:OpenLinkreleasesWineLibpatches.&quot;&gt;May 20th, 2003: OpenLink releases WineLib patches.&lt;/a&gt;</rss:title>
  <dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2003-05-22T20:13:33Z</dc:date>
  <dc:description xmlns:dc="http://purl.org/dc/elements/1.1/">May 20th, 2003: OpenLink releases WineLib patches. OpenLink announced the release of Vladimir&#39;s work to turn Wine into a library that can be used dynamically from Mono. This work simplifies the work on System.Windows.Forms as it is no longer necessary have a special version of the GC, nor have a stub program.  [via Mono Project News]   What has happened here is that we have created an  a Linux/UNIX shared library based API for WINE (which is a WIN32 emulation layer). This will accelerate (via development simplication) the System.Windows.Forms namespace implementation within Mono.  </dc:description>
  <content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<A href="http://www.go-mono.com/index.html#May20th,2003:OpenLinkreleasesWineLibpatches.">May 20th, 2003: OpenLink releases WineLib patches.</A> OpenLink <A href="http://lists.ximian.com/archives/public/mono-winforms-list/2003-May/000284.html">announced</A> the release of Vladimir's work to turn Wine into a library that can be used dynamically from Mono. This work simplifies the work on System.Windows.Forms as it is no longer necessary have a special version of the GC, nor have a stub program.&nbsp; [via <A href="http://www.go-mono.com/">Mono Project News</A>]
<DIV><EM></EM>&nbsp;</DIV>
<DIV><EM>What has happened here is that we have created an&nbsp; a Linux/UNIX shared library based API for <A href="http://www.winehq.com">WINE</A> (which is a WIN32 emulation layer). This&nbsp;will accelerate (via development simplication) the System.Windows.Forms namespace implementation within Mono.</EM></DIV>
<DIV><EM></EM>&nbsp;</DIV>]]></content:encoded>
 </rss:item>
 <rss:item xmlns:rss="http://purl.org/rss/1.0/" rdf:about="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2003-05-22#322">
  <rss:title>&lt;a href=&quot;http://www.oreillynet.com/pub/wlg/3218&quot;&gt;Sue me, I&amp;#39;m a Linux User!&lt;/a&gt;</rss:title>
  <dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2003-05-22T16:14:26Z</dc:date>
  <dc:description xmlns:dc="http://purl.org/dc/elements/1.1/">Sue me, I&#39;m a Linux User! In a great example of Linux users banding together to fight SCO&#39;s attempt to exert ownership over portions of the Linux operating system, there&#39;s now an on-line petition available where thousands of Linux users are literally offering SCO an opportunity to sue them. &lt;p&gt; The petition is appropriately titled, &quot;Hey SCO - Sue Me!&quot;. &lt;p&gt; Check it out - or join the crowd! [via Meerkat: An Open Wire Service: O&#39;Reilly Network Weblogs]</dc:description>
  <content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<A href="http://www.oreillynet.com/pub/wlg/3218">Sue me, I'm a Linux User!</A> In a great example of Linux users banding together to fight SCO's attempt to exert ownership over portions of the Linux operating system, there's now an on-line petition available where thousands of Linux users are literally offering SCO an opportunity to sue them. &lt;p&gt; The petition is appropriately titled, "Hey SCO - Sue Me!". &lt;p&gt; Check it out - or join the crowd! 
<DIV align=right>[via <A href="http://meerkat.oreillynet.com/">Meerkat: An Open Wire Service: O'Reilly Network Weblogs</A>]
<DIV></DIV></DIV>]]></content:encoded>
 </rss:item>
 <rss:item xmlns:rss="http://purl.org/rss/1.0/" rdf:about="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2003-05-22#50">
  <rss:title>&lt;a href=&quot;http://www.oreillynet.com/pub/wlg/3218&quot;&gt;Sue me, I&amp;#39;m a Linux User!&lt;/a&gt;</rss:title>
  <dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2003-05-22T16:14:26Z</dc:date>
  <dc:description xmlns:dc="http://purl.org/dc/elements/1.1/">Sue me, I&#39;m a Linux User! In a great example of Linux users banding together to fight SCO&#39;s attempt to exert ownership over portions of the Linux operating system, there&#39;s now an on-line petition available where thousands of Linux users are literally offering SCO an opportunity to sue them. &lt;p&gt; The petition is appropriately titled, &quot;Hey SCO - Sue Me!&quot;. &lt;p&gt; Check it out - or join the crowd! [via Meerkat: An Open Wire Service: O&#39;Reilly Network Weblogs]</dc:description>
  <content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<a href="http://www.oreillynet.com/pub/wlg/3218">Sue me, I&#39;m a Linux User!</a> In a great example of Linux users banding together to fight SCO&#39;s attempt to exert ownership over portions of the Linux operating system, there&#39;s now an on-line petition available where thousands of Linux users are literally offering SCO an opportunity to sue them. &lt;p&gt; The petition is appropriately titled, &quot;Hey SCO - Sue Me!&quot;. &lt;p&gt; Check it out - or join the crowd! 
<div align="right">[via <a href="http://meerkat.oreillynet.com/">Meerkat: An Open Wire Service: O&#39;Reilly Network Weblogs</a>]
<div></div></div>]]></content:encoded>
 </rss:item>
 <rss:item xmlns:rss="http://purl.org/rss/1.0/" rdf:about="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2003-05-20#308">
  <rss:title>&lt;h2 class=&quot;title&quot; style=&quot;CLEAR: both&quot;&gt;The meaning of &lt;/h2&gt;</rss:title>
  <dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2003-05-20T14:35:44Z</dc:date>
  <dc:description xmlns:dc="http://purl.org/dc/elements/1.1/">0</dc:description>
  <content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[0]]></content:encoded>
 </rss:item>
 <rss:item xmlns:rss="http://purl.org/rss/1.0/" rdf:about="http://www.openlinksw.com/blog/kidehen@openlinksw.com/blog/?date=2003-05-18#305">
  <rss:title>&lt;a href=&quot;http://c.moreover.com/click/here.pl?r72328568&quot;&gt;Microsoft to license SCO Group Unix rights&lt;/a&gt;</rss:title>
  <dc:date xmlns:dc="http://purl.org/dc/elements/1.1/">2003-05-18T18:25:00Z</dc:date>
  <dc:description xmlns:dc="http://purl.org/dc/elements/1.1/">Microsoft to license SCO Group Unix rights ZDNet May 19 2003 2:37AM ET [via Moreover - ZDNet] Houston! We have a problem.Note, that Bill Gates was an early backer of the Original SCO company (the one that licensed the AT&amp;T UNIX license), and this was prior to SCO acquiring Unixware (the AT&amp;T UNIX IP vehicle).  I think IBM and the other large Linux stake holders may have screwed up here, and Microsoft is going make this clearer in the not to distant future.</dc:description>
  <content:encoded xmlns:content="http://purl.org/rss/1.0/modules/content/"><![CDATA[<A href="http://c.moreover.com/click/here.pl?r72328568">Microsoft to license SCO Group Unix rights</A> ZDNet May 19 2003 2:37AM ET 
<DIV align=right>[via <A href="http://www.moreover.com/">Moreover - ZDNet</A>]
<DIV></DIV></DIV>Houston! We have a problem.<BR>Note, that Bill Gates was an early backer of the Original SCO company (the one that licensed the AT&amp;T UNIX license), and this was prior to SCO acquiring Unixware (the AT&amp;T UNIX IP vehicle).&nbsp; I think IBM and the other large Linux stake holders may have screwed up here, and Microsoft is going make this clearer in the not to distant future.]]></content:encoded>
 </rss:item>
</rdf:RDF>