lucy-commits mailing list archives

Site index · List index
Message view « Date » · « Thread »
Top « Date » · « Thread »
From nwelln...@apache.org
Subject [lucy-commits] [15/15] git commit: refs/heads/install-c-library - Sample program using the C library
Date Sat, 18 May 2013 19:24:00 GMT
Sample program using the C library


Project: http://git-wip-us.apache.org/repos/asf/lucy/repo
Commit: http://git-wip-us.apache.org/repos/asf/lucy/commit/27018f3b
Tree: http://git-wip-us.apache.org/repos/asf/lucy/tree/27018f3b
Diff: http://git-wip-us.apache.org/repos/asf/lucy/diff/27018f3b

Branch: refs/heads/install-c-library
Commit: 27018f3bad5155fba446c3083d86f2cf641eb5ab
Parents: acb55b7
Author: Nick Wellnhofer <wellnhofer@aevum.de>
Authored: Sat May 18 21:19:19 2013 +0200
Committer: Nick Wellnhofer <wellnhofer@aevum.de>
Committed: Sat May 18 21:19:19 2013 +0200

----------------------------------------------------------------------
 c/sample/getting_started.c |  189 +++++++++++++++++++++++++++++++++++++++
 1 files changed, 189 insertions(+), 0 deletions(-)
----------------------------------------------------------------------


http://git-wip-us.apache.org/repos/asf/lucy/blob/27018f3b/c/sample/getting_started.c
----------------------------------------------------------------------
diff --git a/c/sample/getting_started.c b/c/sample/getting_started.c
new file mode 100644
index 0000000..0f1f637
--- /dev/null
+++ b/c/sample/getting_started.c
@@ -0,0 +1,189 @@
+/* Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements.  See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License.  You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+/*
+ * Sample program to get started with the Apache Lucy C library.
+ *
+ * Creates an index with a few documents and conducts a few searches.
+ *
+ * If $PREFIX points to your installation directory, it can be compiled with:
+ *
+ *     c99 \
+ *         getting_started.c \
+ *         -I $PREFIX/include -L $PREFIX/lib -l lucy \
+ *         -o getting_started
+ */
+
+#include <stdio.h>
+#include <string.h>
+
+#define LUCY_USE_SHORT_NAMES
+#include "Clownfish/CharBuf.h"
+#include "Lucy/Analysis/EasyAnalyzer.h"
+#include "Lucy/Document/Doc.h"
+#include "Lucy/Document/HitDoc.h"
+#include "Lucy/Index/Indexer.h"
+#include "Lucy/Plan/FullTextType.h"
+#include "Lucy/Plan/Schema.h"
+#include "Lucy/Search/Hits.h"
+#include "Lucy/Search/IndexSearcher.h"
+
+static Schema*
+S_create_schema();
+
+static void
+S_index_documents(Schema *schema, CharBuf *folder);
+
+static void
+S_add_document(Indexer *indexer, const char *title, const char *content);
+
+static void
+S_search(IndexSearcher *searcher, const char *query);
+
+int
+main() {
+    // Initialize the library.
+    lucy_bootstrap_parcel();
+
+    Schema  *schema = S_create_schema();
+    CharBuf *folder = CB_newf("lucy_index");
+
+    S_index_documents(schema, folder);
+
+    IndexSearcher *searcher = IxSearcher_new((Obj*)folder);
+
+    S_search(searcher, "ullamco");
+    S_search(searcher, "ut OR laborum");
+    S_search(searcher, "\"fugiat nulla\"");
+
+    DECREF(schema);
+    DECREF(folder);
+    DECREF(searcher);
+    return 0;
+}
+
+static Schema*
+S_create_schema() {
+    // Create a new schema.
+    Schema *schema = Schema_new();
+
+    // Create an analyzer.
+    CharBuf      *language = CB_newf("en");
+    EasyAnalyzer *analyzer = EasyAnalyzer_new(language);
+
+    // Specify fields.
+
+    FullTextType *type = FullTextType_new((Analyzer*)analyzer);
+
+    {
+        CharBuf *field_cb = CB_newf("title");
+        Schema_Spec_Field(schema, field_cb, (FieldType*)type);
+        DECREF(field_cb);
+    }
+
+    {
+        CharBuf *field_cb = CB_newf("content");
+        Schema_Spec_Field(schema, field_cb, (FieldType*)type);
+        DECREF(field_cb);
+    }
+
+    DECREF(language);
+    DECREF(analyzer);
+    DECREF(type);
+    return schema;
+}
+
+static void
+S_index_documents(Schema *schema, CharBuf *folder) {
+    Indexer *indexer = Indexer_new(schema, (Obj*)folder, NULL,
+                                   Indexer_CREATE | Indexer_TRUNCATE);
+
+    S_add_document(indexer, "Lorem ipsum",
+        "Lorem ipsum dolor sit amet, consectetur adipisicing elit, sed do"
+        " eiusmod tempor incididunt ut labore et dolore magna aliqua."
+    );
+    S_add_document(indexer, "Ut enim",
+        "Ut enim ad minim veniam, quis nostrud exercitation ullamco laboris"
+        " nisi ut aliquip ex ea commodo consequat."
+    );
+    S_add_document(indexer, "Duis aute",
+        "Duis aute irure dolor in reprehenderit in voluptate velit essei"
+        " cillum dolore eu fugiat nulla pariatur."
+    );
+    S_add_document(indexer, "Excepteur sint",
+        "Excepteur sint occaecat cupidatat non proident, sunt in culpa qui"
+        " officia deserunt mollit anim id est laborum."
+    );
+
+    Indexer_Commit(indexer);
+}
+
+static void
+S_add_document(Indexer *indexer, const char *title, const char *content) {
+    Doc *doc = Doc_new(NULL, 0);
+
+    {
+        // Store 'title' field   
+        CharBuf *field_cb = CB_newf("title");
+        CharBuf *value_cb = CB_new_from_utf8(title, strlen(title));
+        Doc_Store(doc, field_cb, (Obj*)value_cb);
+        DECREF(field_cb);
+        DECREF(value_cb);
+    }
+
+    {
+        // Store 'content' field   
+        CharBuf *field_cb = CB_newf("content");
+        CharBuf *value_cb = CB_new_from_utf8(content, strlen(content));
+        Doc_Store(doc, field_cb, (Obj*)value_cb);
+        DECREF(field_cb);
+        DECREF(value_cb);
+    }
+
+    Indexer_Add_Doc(indexer, doc, 1.0);
+
+    DECREF(doc);
+}
+
+static void
+S_search(IndexSearcher *searcher, const char *query) {
+    printf("Searching for: %s\n", query);
+
+    // Execute search query.
+    CharBuf *query_cb = CB_new_from_utf8(query, strlen(query));
+    Hits    *hits     = IxSearcher_Hits(searcher, (Obj*)query_cb, 0, 10, NULL);
+
+    CharBuf *field_cb = CB_newf("title");
+    HitDoc  *hit;
+    int i = 1;
+
+    // Loop over search results.
+    while (NULL != (hit = Hits_Next(hits))) {
+        CharBuf *value_cb = (CharBuf*)HitDoc_Extract(hit, field_cb, NULL);
+
+        printf("Result %d: %s\n", i, CB_Get_Ptr8(value_cb));
+
+        DECREF(hit);
+        i++;
+    }
+
+    printf("\n");
+
+    DECREF(query_cb);
+    DECREF(hits);
+    DECREF(field_cb);
+}
+


Mime
View raw message