<?xml version="1.0" encoding="UTF-8"?>
<rss version="2.0"
	xmlns:content="http://purl.org/rss/1.0/modules/content/"
	xmlns:wfw="http://wellformedweb.org/CommentAPI/"
	xmlns:dc="http://purl.org/dc/elements/1.1/"
	xmlns:atom="http://www.w3.org/2005/Atom"
	xmlns:sy="http://purl.org/rss/1.0/modules/syndication/"
	xmlns:slash="http://purl.org/rss/1.0/modules/slash/"
	>

<channel>
	<title>OpenSource Connections &#124; Solr, Big Data, and NoSQL consultants</title>
	<atom:link href="http://www.opensourceconnections.com/feed/" rel="self" type="application/rss+xml" />
	<link>http://www.opensourceconnections.com</link>
	<description>Optimal data structures for rich, discovery-driven user interfaces</description>
	<lastBuildDate>Wed, 22 May 2013 20:29:21 +0000</lastBuildDate>
	<language>en-US</language>
	<sy:updatePeriod>hourly</sy:updatePeriod>
	<sy:updateFrequency>1</sy:updateFrequency>
	<generator>http://wordpress.org/?v=3.5.1</generator>
		<item>
		<title>What happened to CharStream/CharReader in Lucene?</title>
		<link>http://www.opensourceconnections.com/2013/05/22/what-happened-to-charstreamcharreader-in-lucene/</link>
		<comments>http://www.opensourceconnections.com/2013/05/22/what-happened-to-charstreamcharreader-in-lucene/#comments</comments>
		<pubDate>Wed, 22 May 2013 20:29:21 +0000</pubDate>
		<dc:creator>Doug Turnbull</dc:creator>
				<category><![CDATA[solr]]></category>

		<guid isPermaLink="false">http://www.opensourceconnections.com/?p=3557</guid>
		<description><![CDATA[A pretty subtle change happened in the transition from Lucene/Solr 3 to 4. The abstract method for CharFilterFactory changed from public CharStream create(CharStream input); to public abstract Reader create(Reader input); What ’s up with this change? Why did it happen? Well first, let’s take a step back and explain why CharStream existed. CharStream inherited from [...]]]></description>
		<wfw:commentRss>http://www.opensourceconnections.com/2013/05/22/what-happened-to-charstreamcharreader-in-lucene/feed/</wfw:commentRss>
		<slash:comments>2</slash:comments>
		</item>
		<item>
		<title>Introducing OSCAR! Search your notes no matter where they live!</title>
		<link>http://www.opensourceconnections.com/2013/05/21/introducing-oscar-search-your-notes-no-matter-where-they-live/</link>
		<comments>http://www.opensourceconnections.com/2013/05/21/introducing-oscar-search-your-notes-no-matter-where-they-live/#comments</comments>
		<pubDate>Tue, 21 May 2013 16:28:18 +0000</pubDate>
		<dc:creator>Krystal Xu</dc:creator>
				<category><![CDATA[solr]]></category>

		<guid isPermaLink="false">http://www.opensourceconnections.com/?p=3548</guid>
		<description><![CDATA[In our daily adventures on our computers and the Internet, we often find/create notes or documents that we would like to keep for later, that we attempt to organize. We put them in our email, in Google Docs, in Dropbox, in Gist, and countless other places. Then when we want to find them later, it’s [...]]]></description>
		<wfw:commentRss>http://www.opensourceconnections.com/2013/05/21/introducing-oscar-search-your-notes-no-matter-where-they-live/feed/</wfw:commentRss>
		<slash:comments>0</slash:comments>
		</item>
		<item>
		<title>Initial Impressions of Elasticsearch &#8211; Flexible Open Source Distributed Search</title>
		<link>http://www.opensourceconnections.com/2013/05/20/initial-impressions-of-elasticsearch-flexible-open-source-distributed-search/</link>
		<comments>http://www.opensourceconnections.com/2013/05/20/initial-impressions-of-elasticsearch-flexible-open-source-distributed-search/#comments</comments>
		<pubDate>Mon, 20 May 2013 21:28:42 +0000</pubDate>
		<dc:creator>Jonathan Thompson</dc:creator>
				<category><![CDATA[Big Data]]></category>

		<guid isPermaLink="false">http://www.opensourceconnections.com/?p=3546</guid>
		<description><![CDATA[I’m Jonathan Thompson, a rising 4th year CS major at UVA. This is my first blog post as an intern at OSC, I hope you enjoy it! While my teammate Krystal worked on integrating OSCAR, the OSC Automated Robot, with Solr, I forked the project and used it as an opportunity to demo Elasticsearch. Was [...]]]></description>
		<wfw:commentRss>http://www.opensourceconnections.com/2013/05/20/initial-impressions-of-elasticsearch-flexible-open-source-distributed-search/feed/</wfw:commentRss>
		<slash:comments>0</slash:comments>
		</item>
		<item>
		<title>National Day of Civic Hacking at OpenSource Connections</title>
		<link>http://www.opensourceconnections.com/2013/05/20/national-day-of-civic-hacking-at-opensource-connections/</link>
		<comments>http://www.opensourceconnections.com/2013/05/20/national-day-of-civic-hacking-at-opensource-connections/#comments</comments>
		<pubDate>Mon, 20 May 2013 20:37:00 +0000</pubDate>
		<dc:creator>Matt Overstreet</dc:creator>
				<category><![CDATA[Big Data]]></category>
		<category><![CDATA[Community]]></category>
		<category><![CDATA[Government]]></category>
		<category><![CDATA[hadoop]]></category>
		<category><![CDATA[News]]></category>
		<category><![CDATA[Python]]></category>
		<category><![CDATA[Ruby]]></category>

		<guid isPermaLink="false">http://www.opensourceconnections.com/?p=3542</guid>
		<description><![CDATA[National Day of Civic Hacking at OpenSource Connections What OSC is excited to join 86 other venues across the US for civic hacking and camaraderie. Come join us and find like minded folks to help you save the world. Better yet, lend your skills to someone else&apos;s great idea! When Saturday, June 1 from 9:00AM [...]]]></description>
		<wfw:commentRss>http://www.opensourceconnections.com/2013/05/20/national-day-of-civic-hacking-at-opensource-connections/feed/</wfw:commentRss>
		<slash:comments>0</slash:comments>
		</item>
		<item>
		<title>How does a search engine work? An educational trek through a Lucene Postings Format</title>
		<link>http://www.opensourceconnections.com/2013/05/20/how-does-a-search-engine-work-an-educational-trek-through-a-lucene-postings-format/</link>
		<comments>http://www.opensourceconnections.com/2013/05/20/how-does-a-search-engine-work-an-educational-trek-through-a-lucene-postings-format/#comments</comments>
		<pubDate>Mon, 20 May 2013 14:13:06 +0000</pubDate>
		<dc:creator>Doug Turnbull</dc:creator>
				<category><![CDATA[solr]]></category>

		<guid isPermaLink="false">http://www.opensourceconnections.com/?p=3523</guid>
		<description><![CDATA[A new feature of Lucene 4 – pluggable codecs – allows for the modification of Lucene’s underlying storage engine. Working with codecs and examining their output yields fascinating insights into how exactly Lucene’s search works in its most fundamental form. The centerpiece of a Lucene codec is it’s postings format. Postings are a commonly thrown [...]]]></description>
		<wfw:commentRss>http://www.opensourceconnections.com/2013/05/20/how-does-a-search-engine-work-an-educational-trek-through-a-lucene-postings-format/feed/</wfw:commentRss>
		<slash:comments>0</slash:comments>
		</item>
		<item>
		<title>Does FoundationDB beat the CAP conjecture?  Hackathon on Friday!</title>
		<link>http://www.opensourceconnections.com/2013/05/06/does-foundationdb-beat-the-cap-conjecture-hackathon-on-friday/</link>
		<comments>http://www.opensourceconnections.com/2013/05/06/does-foundationdb-beat-the-cap-conjecture-hackathon-on-friday/#comments</comments>
		<pubDate>Mon, 06 May 2013 20:45:59 +0000</pubDate>
		<dc:creator>Eric Pugh</dc:creator>
				<category><![CDATA[Community]]></category>
		<category><![CDATA[FoundationDB]]></category>
		<category><![CDATA[News]]></category>
		<category><![CDATA[Rapid Prototyping]]></category>
		<category><![CDATA[coworking]]></category>
		<category><![CDATA[hackathon]]></category>

		<guid isPermaLink="false">http://www.opensourceconnections.com/?p=3502</guid>
		<description><![CDATA[We&#8217;re cohosting a hackathon with FoundationDB on Friday. For those of you not in the know, FoundationDB is a pretty exciting addition to the NoSQL space. It brings flexible, arbitrary transactionality (including atomic cross-row joins in a distributed system) to NoSQL. My colleague Doug Turnbull got very excited about the technology a few months ago [...]]]></description>
		<wfw:commentRss>http://www.opensourceconnections.com/2013/05/06/does-foundationdb-beat-the-cap-conjecture-hackathon-on-friday/feed/</wfw:commentRss>
		<slash:comments>1</slash:comments>
		</item>
		<item>
		<title>Search is Eating The World &#124; Recap of Lucene Revolution</title>
		<link>http://www.opensourceconnections.com/2013/05/06/search-is-eating-the-world-recap-of-lucene-revolution/</link>
		<comments>http://www.opensourceconnections.com/2013/05/06/search-is-eating-the-world-recap-of-lucene-revolution/#comments</comments>
		<pubDate>Mon, 06 May 2013 15:17:20 +0000</pubDate>
		<dc:creator>Doug Turnbull</dc:creator>
				<category><![CDATA[solr]]></category>

		<guid isPermaLink="false">http://www.opensourceconnections.com/?p=3478</guid>
		<description><![CDATA[Much of the crew just got back from Lucene Revolution. It was an incredible experience to hang out with the cream-of-the-crop of the Lucene/Solr community. It continues to be clear that modern applications of all stripes are increasingly driven by search as the primary UI component. Users of these applications expect rich interactivity. And because [...]]]></description>
		<wfw:commentRss>http://www.opensourceconnections.com/2013/05/06/search-is-eating-the-world-recap-of-lucene-revolution/feed/</wfw:commentRss>
		<slash:comments>1</slash:comments>
		</item>
		<item>
		<title>Indexing Millions of Documents using Tika and Atomic Update</title>
		<link>http://www.opensourceconnections.com/2013/04/28/indexing-millions-of-documents-using-tika-and-atomic-update/</link>
		<comments>http://www.opensourceconnections.com/2013/04/28/indexing-millions-of-documents-using-tika-and-atomic-update/#comments</comments>
		<pubDate>Mon, 29 Apr 2013 02:41:48 +0000</pubDate>
		<dc:creator>Patricia Gorla</dc:creator>
				<category><![CDATA[solr]]></category>

		<guid isPermaLink="false">http://www.opensourceconnections.com/?p=3461</guid>
		<description><![CDATA[On a recent engagement, we were posed with the problem of sorting through 6.5 million foreign patent documents and indexing them into Solr. This totaled about 1 TB of XML text data alone. The full corpus included an additional 5 TB of images to incorporate into the index; this blog post will only cover the [...]]]></description>
		<wfw:commentRss>http://www.opensourceconnections.com/2013/04/28/indexing-millions-of-documents-using-tika-and-atomic-update/feed/</wfw:commentRss>
		<slash:comments>0</slash:comments>
		</item>
		<item>
		<title>Understanding Solr Soft Commits and Data Durability</title>
		<link>http://www.opensourceconnections.com/2013/04/25/understanding-solr-soft-commits-and-data-durability/</link>
		<comments>http://www.opensourceconnections.com/2013/04/25/understanding-solr-soft-commits-and-data-durability/#comments</comments>
		<pubDate>Fri, 26 Apr 2013 03:11:06 +0000</pubDate>
		<dc:creator>John Berryman</dc:creator>
				<category><![CDATA[solr]]></category>

		<guid isPermaLink="false">http://www.opensourceconnections.com/?p=3458</guid>
		<description><![CDATA[I ran into an interesting problem today. I was working with the first project where we legitimately needed Solr soft commits and in testing my configuration I wanted to prove to myself that the soft commits were performing as expected. Namely, I expected soft commits to flush all added documents to an in-RAM index so [...]]]></description>
		<wfw:commentRss>http://www.opensourceconnections.com/2013/04/25/understanding-solr-soft-commits-and-data-durability/feed/</wfw:commentRss>
		<slash:comments>1</slash:comments>
		</item>
		<item>
		<title>Beginner Tips for Elastic MapReduce</title>
		<link>http://www.opensourceconnections.com/2013/04/21/beginner-tips-for-elastic-mapreduce/</link>
		<comments>http://www.opensourceconnections.com/2013/04/21/beginner-tips-for-elastic-mapreduce/#comments</comments>
		<pubDate>Sun, 21 Apr 2013 20:58:23 +0000</pubDate>
		<dc:creator>John Berryman</dc:creator>
				<category><![CDATA[solr]]></category>

		<guid isPermaLink="false">http://www.opensourceconnections.com/?p=3430</guid>
		<description><![CDATA[By this point everyone is well acquainted with the power of Hadoop&#8217;s MapReduce. But what you&#8217;re also probably well acquainted with is the pain that must be suffered when setting up your own Hadoop cluster. Sure, there are some really good tutorials online if you know where to look: here is a great one for [...]]]></description>
		<wfw:commentRss>http://www.opensourceconnections.com/2013/04/21/beginner-tips-for-elastic-mapreduce/feed/</wfw:commentRss>
		<slash:comments>0</slash:comments>
		</item>
		<item>
		<title>Querying More Fields != More Results &#8212; Stop wording and Dismax&#8217;s mm (min should match) argument</title>
		<link>http://www.opensourceconnections.com/2013/04/15/querying-more-fields-more-results-stop-wording-and-solrs-mm-min-should-match-argument/</link>
		<comments>http://www.opensourceconnections.com/2013/04/15/querying-more-fields-more-results-stop-wording-and-solrs-mm-min-should-match-argument/#comments</comments>
		<pubDate>Mon, 15 Apr 2013 20:35:10 +0000</pubDate>
		<dc:creator>Doug Turnbull</dc:creator>
				<category><![CDATA[solr]]></category>

		<guid isPermaLink="false">http://www.opensourceconnections.com/?p=3349</guid>
		<description><![CDATA[Let’s recall from Anatomy of a Dismax Query some key components to the dismax query parser: qf – the fields we will search over (we’ll take the highest score out of all the fields that match) mm – the minimum number of fields that MUST match the query OK, now we&#8217;ve had plenty of time [...]]]></description>
		<wfw:commentRss>http://www.opensourceconnections.com/2013/04/15/querying-more-fields-more-results-stop-wording-and-solrs-mm-min-should-match-argument/feed/</wfw:commentRss>
		<slash:comments>1</slash:comments>
		</item>
		<item>
		<title>How to Debug Solr With Eclipse</title>
		<link>http://www.opensourceconnections.com/2013/04/13/how-to-debug-solr-with-eclipse/</link>
		<comments>http://www.opensourceconnections.com/2013/04/13/how-to-debug-solr-with-eclipse/#comments</comments>
		<pubDate>Sun, 14 Apr 2013 03:14:43 +0000</pubDate>
		<dc:creator>Doug Turnbull</dc:creator>
				<category><![CDATA[Programming]]></category>
		<category><![CDATA[solr]]></category>
		<category><![CDATA[debugging]]></category>
		<category><![CDATA[eclipse]]></category>

		<guid isPermaLink="false">http://www.opensourceconnections.com/?p=3314</guid>
		<description><![CDATA[Recently I was puzzled by some behavior Solr was showing me. I scratched my head and called over a colleague. We couldn&#8217;t quite figure out what was going on. Well Solr is open source so&#8230; next stop – Debuggersville! Running Solr in the Eclipse debugger isn’t hard, but there are many scattered user group posts [...]]]></description>
		<wfw:commentRss>http://www.opensourceconnections.com/2013/04/13/how-to-debug-solr-with-eclipse/feed/</wfw:commentRss>
		<slash:comments>0</slash:comments>
		</item>
		<item>
		<title>Modifying Solr Result Relevancy via an &#8220;Auxiliary Boost&#8221; Field</title>
		<link>http://www.opensourceconnections.com/2013/04/10/modifying-solr-result-relevancy-via-an-auxiliary-boost-field/</link>
		<comments>http://www.opensourceconnections.com/2013/04/10/modifying-solr-result-relevancy-via-an-auxiliary-boost-field/#comments</comments>
		<pubDate>Wed, 10 Apr 2013 19:49:55 +0000</pubDate>
		<dc:creator>John Berryman</dc:creator>
				<category><![CDATA[solr]]></category>

		<guid isPermaLink="false">http://www.opensourceconnections.com/?p=3294</guid>
		<description><![CDATA[English is a confusing language. I mean, does it really make sense that you can park in a driveway or drive in a parkway? Also, I&#8217;ve always been amused that there actually exists a class of words that are their own antonym &#8211; so called &#8220;auto-antonyms&#8221;: cleave &#8211; 1] Split or sever (something) 2] Stick [...]]]></description>
		<wfw:commentRss>http://www.opensourceconnections.com/2013/04/10/modifying-solr-result-relevancy-via-an-auxiliary-boost-field/feed/</wfw:commentRss>
		<slash:comments>3</slash:comments>
		</item>
		<item>
		<title>Beginners guide to enhancing Solr/Lucene search with Mahout&#8217;s Machine Learning</title>
		<link>http://www.opensourceconnections.com/2013/04/04/complete-n00bs-guide-to-enhancing-solrlucene-search-with-mahouts-machine-learning/</link>
		<comments>http://www.opensourceconnections.com/2013/04/04/complete-n00bs-guide-to-enhancing-solrlucene-search-with-mahouts-machine-learning/#comments</comments>
		<pubDate>Fri, 05 Apr 2013 04:02:11 +0000</pubDate>
		<dc:creator>Doug Turnbull</dc:creator>
				<category><![CDATA[Analytics]]></category>
		<category><![CDATA[Big Data]]></category>
		<category><![CDATA[Natural Language Processing]]></category>

		<guid isPermaLink="false">http://www.opensourceconnections.com/?p=3228</guid>
		<description><![CDATA[Yesterday, John and I gave a talk to the DC Hadoop Users Group about using Mahout with Solr to perform Latent Semantic Indexing &#8212; calculating and exploiting the semantic relationships between keywords. While we were there, I realized, a lot of people could benefit from a bigger picture, less in-depth, point of view outside of [...]]]></description>
		<wfw:commentRss>http://www.opensourceconnections.com/2013/04/04/complete-n00bs-guide-to-enhancing-solrlucene-search-with-mahouts-machine-learning/feed/</wfw:commentRss>
		<slash:comments>1</slash:comments>
		</item>
		<item>
		<title>OpenSource Connections to present at DC Hadoop User Group</title>
		<link>http://www.opensourceconnections.com/2013/04/01/opensource-connections-will-be-presenting-at-dc-hadoop-user-group/</link>
		<comments>http://www.opensourceconnections.com/2013/04/01/opensource-connections-will-be-presenting-at-dc-hadoop-user-group/#comments</comments>
		<pubDate>Mon, 01 Apr 2013 08:49:15 +0000</pubDate>
		<dc:creator>John Berryman</dc:creator>
				<category><![CDATA[solr]]></category>

		<guid isPermaLink="false">http://www.opensourceconnections.com/?p=3224</guid>
		<description><![CDATA[OpenSource Connections is investigating the use of Mahout(/Hadoop) to incorporate recommendations and Latent Semantic Indexing (LSI) into Solr search. In this fast-paced talk we&#8217;ll cover the theory behind recommenders and LSI (two-sides of the same coin), we&#8217;ll discuss why this project is a Big Data project and we&#8217;ll present our approach using a combination of [...]]]></description>
		<wfw:commentRss>http://www.opensourceconnections.com/2013/04/01/opensource-connections-will-be-presenting-at-dc-hadoop-user-group/feed/</wfw:commentRss>
		<slash:comments>0</slash:comments>
		</item>
		<item>
		<title>Debugging &#8220;Wrong FS expected: file:///&#8221; exception from HDFS</title>
		<link>http://www.opensourceconnections.com/2013/03/24/hdfs-debugging-wrong-fs-expected-file-exception/</link>
		<comments>http://www.opensourceconnections.com/2013/03/24/hdfs-debugging-wrong-fs-expected-file-exception/#comments</comments>
		<pubDate>Sun, 24 Mar 2013 16:46:33 +0000</pubDate>
		<dc:creator>Doug Turnbull</dc:creator>
				<category><![CDATA[Big Data]]></category>
		<category><![CDATA[hadoop]]></category>
		<category><![CDATA[Java]]></category>
		<category><![CDATA[hdfs]]></category>

		<guid isPermaLink="false">http://www.opensourceconnections.com/?p=3188</guid>
		<description><![CDATA[I just spent some time putting together some basic Java code to read some data from HDFS. Pretty basic stuff. No map reduce involved. Pretty boilerplate code like the stuff from this popular tutorial on the topic. No matter what, I kept hitting my head on this error: Exception in thread &#8220;main&#8221; java.lang.IllegalArgumentException: Wrong FS: [...]]]></description>
		<wfw:commentRss>http://www.opensourceconnections.com/2013/03/24/hdfs-debugging-wrong-fs-expected-file-exception/feed/</wfw:commentRss>
		<slash:comments>0</slash:comments>
		</item>
	</channel>
</rss>
