From fbea6fe6339dbf4c5b0dc20c844a0740094cd5fc Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?Damir=20Jeli=C4=87?= <poljar@termina.org.uk>
Date: Tue, 1 Oct 2019 20:05:38 +0200
Subject: [PATCH 1/4] searcher: Remove the collector concept.

This patch removes the TopDocs collector class and adds a limit
argument on the search method.
---
 src/lib.rs            |  3 +--
 src/searcher.rs       | 37 ++++++++++---------------------------
 tests/tantivy_test.py | 22 +++++++---------------
 3 files changed, 18 insertions(+), 44 deletions(-)
diff --git a/src/lib.rs b/src/lib.rs
index 5cb0826..be75122 100644
--- a/src/lib.rs
+++ b/src/lib.rs
@@ -14,7 +14,7 @@ use facet::Facet;
 use index::Index;
 use schema::Schema;
 use schemabuilder::SchemaBuilder;
-use searcher::{DocAddress, Searcher, TopDocs};
+use searcher::{DocAddress, Searcher};
 
 /// Python bindings for the search engine library Tantivy.
 ///
@@ -76,7 +76,6 @@ fn tantivy(_py: Python, m: &PyModule) -> PyResult<()> {
     m.add_class::<Document>()?;
     m.add_class::<Index>()?;
     m.add_class::<DocAddress>()?;
-    m.add_class::<TopDocs>()?;
     m.add_class::<Facet>()?;
     Ok(())
 }
diff --git a/src/searcher.rs b/src/searcher.rs
index b336ab7..6871763 100644
--- a/src/searcher.rs
+++ b/src/searcher.rs
@@ -29,20 +29,25 @@ impl Searcher {
     /// search results.
     ///
     /// Raises a ValueError if there was an error with the search.
+    #[args(limit = 10)]
     fn search(
         &self,
+        py: Python,
         query: &Query,
-        collector: &mut TopDocs,
-    ) -> PyResult<Vec<(f32, DocAddress)>> {
-        let ret = self.inner.search(&query.inner, &collector.inner);
+        limit: usize,
+    ) -> PyResult<Vec<(PyObject, DocAddress)>> {
+        let collector = tv::collector::TopDocs::with_limit(limit);
+        let ret = self.inner.search(&query.inner, &collector);
+
         match ret {
             Ok(r) => {
-                let result: Vec<(f32, DocAddress)> =
-                    r.iter().map(|(f, d)| (*f, DocAddress::from(d))).collect();
+                let result: Vec<(PyObject, DocAddress)> =
+                    r.iter().map(|(f, d)| ((*f).into_py(py), DocAddress::from(d))).collect();
                 Ok(result)
             }
             Err(e) => Err(exceptions::ValueError::py_err(e.to_string())),
         }
+
     }
 
     /// Returns the overall number of documents in the index.
@@ -110,28 +115,6 @@ impl Into<tv::DocAddress> for &DocAddress {
     }
 }
 
-/// The Top Score Collector keeps track of the K documents sorted by their
-/// score.
-///
-/// Args:
-///     limit (int, optional): The number of documents that the top scorer will
-///         retrieve. Must be a positive integer larger than 0. Defaults to 10.
-#[pyclass]
-pub(crate) struct TopDocs {
-    inner: tv::collector::TopDocs,
-}
-
-#[pymethods]
-impl TopDocs {
-    #[new]
-    #[args(limit = 10)]
-    fn new(obj: &PyRawObject, limit: usize) -> PyResult<()> {
-        let top = tv::collector::TopDocs::with_limit(limit);
-        obj.init(TopDocs { inner: top });
-        Ok(())
-    }
-}
-
 #[pyproto]
 impl PyObjectProtocol for Searcher {
     fn __repr__(&self) -> PyResult<String> {
diff --git a/tests/tantivy_test.py b/tests/tantivy_test.py
index 347baa8..c57b90a 100644
--- a/tests/tantivy_test.py
+++ b/tests/tantivy_test.py
@@ -76,9 +76,7 @@ class TestClass(object):
         _, index = dir_index
         query = index.parse_query("sea whale", ["title", "body"])
 
-        top_docs = tantivy.TopDocs(10)
-
-        result = index.searcher().search(query, top_docs)
+        result = index.searcher().search(query, 10)
         assert len(result) == 1
 
     def test_simple_search_after_reuse(self, dir_index):
@@ -86,18 +84,14 @@ class TestClass(object):
         index = Index(schema(), str(index_dir))
         query = index.parse_query("sea whale", ["title", "body"])
 
-        top_docs = tantivy.TopDocs(10)
-
-        result = index.searcher().search(query, top_docs)
+        result = index.searcher().search(query, 10)
         assert len(result) == 1
 
     def test_simple_search_in_ram(self, ram_index):
         index = ram_index
         query = index.parse_query("sea whale", ["title", "body"])
 
-        top_docs = tantivy.TopDocs(10)
-
-        result = index.searcher().search(query, top_docs)
+        result = index.searcher().search(query, 10)
         assert len(result) == 1
         _, doc_address = result[0]
         searched_doc = index.searcher().doc(doc_address)
@@ -107,15 +101,14 @@ class TestClass(object):
         index = ram_index
         query = index.parse_query("title:men AND body:summer", default_field_names=["title", "body"])
         # look for an intersection of documents
-        top_docs = tantivy.TopDocs(10)
         searcher = index.searcher()
-        result = searcher.search(query, top_docs)
+        result = searcher.search(query, 10)
 
         # summer isn't present
         assert len(result) == 0
 
         query = index.parse_query("title:men AND body:winter", ["title", "body"])
-        result = searcher.search(query, top_docs)
+        result = searcher.search(query)
 
         assert len(result) == 1
 
@@ -142,8 +135,7 @@ class TestClass(object):
 class TestUpdateClass(object):
     def test_delete_update(self, ram_index):
         query = ram_index.parse_query("Frankenstein", ["title"])
-        top_docs = tantivy.TopDocs(10)
-        result = ram_index.searcher().search(query, top_docs)
+        result = ram_index.searcher().search(query, 10)
         assert len(result) == 1
 
         writer = ram_index.writer()
@@ -158,7 +150,7 @@ class TestUpdateClass(object):
         writer.commit()
         ram_index.reload()
 
-        result = ram_index.searcher().search(query, top_docs)
+        result = ram_index.searcher().search(query)
         assert len(result) == 0
 
 

From d46417c22054cf1b57c636b7fc60799f9b28b7a1 Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?Damir=20Jeli=C4=87?= <poljar@termina.org.uk>
Date: Tue, 1 Oct 2019 20:56:42 +0200
Subject: [PATCH 2/4] searcher: Allow the search to be sorted by an unsigned
 field.

---
 src/index.rs          | 11 +++--------
 src/lib.rs            | 12 ++++++++++++
 src/searcher.rs       | 34 +++++++++++++++++++++-------------
 tests/tantivy_test.py | 28 ++++++++++++++++++++++++++++
 4 files changed, 64 insertions(+), 21 deletions(-)

diff --git a/src/index.rs b/src/index.rs
index c20af98..ac7f5ef 100644
--- a/src/index.rs
+++ b/src/index.rs
@@ -8,7 +8,7 @@ use crate::document::{extract_value, Document};
 use crate::query::Query;
 use crate::schema::Schema;
 use crate::searcher::Searcher;
-use crate::to_pyerr;
+use crate::{to_pyerr, get_field};
 use tantivy as tv;
 use tantivy::directory::MmapDirectory;
 use tantivy::schema::{Field, NamedFieldDocument, Term, Value};
@@ -111,13 +111,7 @@ impl IndexWriter {
         field_name: &str,
         field_value: &PyAny,
     ) -> PyResult<u64> {
-        let field = self.schema.get_field(field_name).ok_or_else(|| {
-            exceptions::ValueError::py_err(format!(
-                "Field `{}` is not defined in the schema.",
-                field_name
-            ))
-        })?;
-
+        let field = get_field(&self.schema, field_name)?;
         let value = extract_value(field_value)?;
         let term = match value {
             Value::Str(text) => Term::from_field_text(field, &text),
@@ -274,6 +268,7 @@ impl Index {
     fn searcher(&self) -> Searcher {
         Searcher {
             inner: self.reader.searcher(),
+            schema: self.index.schema(),
         }
     }
 
diff --git a/src/lib.rs b/src/lib.rs
index be75122..77cf565 100644
--- a/src/lib.rs
+++ b/src/lib.rs
@@ -1,5 +1,6 @@
 use pyo3::exceptions;
 use pyo3::prelude::*;
+use tantivy as tv;
 
 mod document;
 mod facet;
@@ -83,3 +84,14 @@ fn tantivy(_py: Python, m: &PyModule) -> PyResult<()> {
 pub(crate) fn to_pyerr<E: ToString>(err: E) -> PyErr {
     exceptions::ValueError::py_err(err.to_string())
 }
+
+pub(crate) fn get_field(schema: &tv::schema::Schema, field_name: &str) -> PyResult<tv::schema::Field> {
+    let field = schema.get_field(field_name).ok_or_else(|| {
+        exceptions::ValueError::py_err(format!(
+            "Field `{}` is not defined in the schema.",
+                field_name
+        ))
+    })?;
+
+    Ok(field)
+}
diff --git a/src/searcher.rs b/src/searcher.rs
index 6871763..1de5e2b 100644
--- a/src/searcher.rs
+++ b/src/searcher.rs
@@ -2,9 +2,9 @@
 
 use crate::document::Document;
 use crate::query::Query;
-use crate::to_pyerr;
+use crate::{to_pyerr, get_field};
 use pyo3::prelude::*;
-use pyo3::{exceptions, PyObjectProtocol};
+use pyo3::PyObjectProtocol;
 use tantivy as tv;
 
 /// Tantivy's Searcher class
@@ -13,8 +13,11 @@ use tantivy as tv;
 #[pyclass]
 pub(crate) struct Searcher {
     pub(crate) inner: tv::LeasedItem<tv::Searcher>,
+    pub(crate) schema: tv::schema::Schema,
 }
 
+const SORT_BY: &str = "";
+
 #[pymethods]
 impl Searcher {
     /// Search the index with the given query and collect results.
@@ -29,25 +32,30 @@ impl Searcher {
     /// search results.
     ///
     /// Raises a ValueError if there was an error with the search.
-    #[args(limit = 10)]
+    #[args(limit = 10, sort_by = "SORT_BY")]
     fn search(
         &self,
         py: Python,
         query: &Query,
         limit: usize,
+        sort_by: &str,
     ) -> PyResult<Vec<(PyObject, DocAddress)>> {
-        let collector = tv::collector::TopDocs::with_limit(limit);
-        let ret = self.inner.search(&query.inner, &collector);
+        let field = match sort_by {
+            "" => None,
+            field_name => Some(get_field(&self.schema, field_name)?)
+        };
 
-        match ret {
-            Ok(r) => {
-                let result: Vec<(PyObject, DocAddress)> =
-                    r.iter().map(|(f, d)| ((*f).into_py(py), DocAddress::from(d))).collect();
-                Ok(result)
-            }
-            Err(e) => Err(exceptions::ValueError::py_err(e.to_string())),
-        }
+        let result = if let Some(f) = field {
+            let collector = tv::collector::TopDocs::with_limit(limit).order_by_u64_field(f);
+            let ret = self.inner.search(&query.inner, &collector).map_err(to_pyerr)?;
+            ret.iter().map(|(f, d)| ((*f).into_py(py), DocAddress::from(d))).collect()
+        } else {
+            let collector = tv::collector::TopDocs::with_limit(limit);
+            let ret = self.inner.search(&query.inner, &collector).map_err(to_pyerr)?;
+            ret.iter().map(|(f, d)| ((*f).into_py(py), DocAddress::from(d))).collect()
+        };
 
+        Ok(result)
     }
 
     /// Returns the overall number of documents in the index.
diff --git a/tests/tantivy_test.py b/tests/tantivy_test.py
index c57b90a..0999b3c 100644
--- a/tests/tantivy_test.py
+++ b/tests/tantivy_test.py
@@ -131,6 +131,34 @@ class TestClass(object):
         with pytest.raises(ValueError):
             index.parse_query("bod:men", ["title", "body"])
 
+    def test_sort_by_search(self):
+        schema = (
+            SchemaBuilder()
+            .add_text_field("message", stored=True)
+            .add_unsigned_field("timestamp", stored=True, fast="single")
+            .build()
+        )
+        index = Index(schema)
+        writer = index.writer()
+        doc = Document()
+        doc.add_text("message", "Test message")
+        doc.add_unsigned("timestamp", 1569954264)
+        writer.add_document(doc)
+
+        doc = Document()
+        doc.add_text("message", "Another test message")
+        doc.add_unsigned("timestamp", 1569954280)
+
+        writer.add_document(doc)
+
+        writer.commit()
+        index.reload()
+
+        query = index.parse_query("test")
+        result = index.searcher().search(query, 10, sort_by="timestamp")
+        assert result[0][0] == 1569954280
+        assert result[1][0] == 1569954264
+
 
 class TestUpdateClass(object):
     def test_delete_update(self, ram_index):

From cfa15a001d38975a43edd3a502a83c33369fbdfa Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?Damir=20Jeli=C4=87?= <poljar@termina.org.uk>
Date: Tue, 17 Dec 2019 20:50:10 +0100
Subject: [PATCH 3/4] searcher: Use a search result struct.

---
 src/searcher.rs       | 66 ++++++++++++++++++++++++++++++++++++-------
 tests/tantivy_test.py | 12 ++++----
 2 files changed, 62 insertions(+), 16 deletions(-)

diff --git a/src/searcher.rs b/src/searcher.rs
index 1de5e2b..bf92dd0 100644
--- a/src/searcher.rs
+++ b/src/searcher.rs
@@ -6,6 +6,7 @@ use crate::{to_pyerr, get_field};
 use pyo3::prelude::*;
 use pyo3::PyObjectProtocol;
 use tantivy as tv;
+use tantivy::collector::{MultiCollector, Count, TopDocs};
 
 /// Tantivy's Searcher class
 ///
@@ -18,6 +19,12 @@ pub(crate) struct Searcher {
 
 const SORT_BY: &str = "";
 
+#[pyclass]
+pub(crate) struct SearchResult {
+    pub(crate) hits: Vec<(PyObject, DocAddress)>,
+    pub(crate) count: Option<usize>
+}
+
 #[pymethods]
 impl Searcher {
     /// Search the index with the given query and collect results.
@@ -32,30 +39,69 @@ impl Searcher {
     /// search results.
     ///
     /// Raises a ValueError if there was an error with the search.
-    #[args(limit = 10, sort_by = "SORT_BY")]
+    #[args(limit = 10, sort_by = "SORT_BY", count = true)]
     fn search(
         &self,
         py: Python,
         query: &Query,
         limit: usize,
+        count: bool,
         sort_by: &str,
-    ) -> PyResult<Vec<(PyObject, DocAddress)>> {
+    ) -> PyResult<SearchResult> {
         let field = match sort_by {
             "" => None,
             field_name => Some(get_field(&self.schema, field_name)?)
         };
 
-        let result = if let Some(f) = field {
-            let collector = tv::collector::TopDocs::with_limit(limit).order_by_u64_field(f);
-            let ret = self.inner.search(&query.inner, &collector).map_err(to_pyerr)?;
-            ret.iter().map(|(f, d)| ((*f).into_py(py), DocAddress::from(d))).collect()
+        let mut multicollector = tv::collector::MultiCollector::new();
+
+        let count_handle = if count {
+            Some(multicollector.add_collector(Count))
         } else {
-            let collector = tv::collector::TopDocs::with_limit(limit);
-            let ret = self.inner.search(&query.inner, &collector).map_err(to_pyerr)?;
-            ret.iter().map(|(f, d)| ((*f).into_py(py), DocAddress::from(d))).collect()
+            None
         };
 
-        Ok(result)
+
+        let (mut multifruit, hits) = match field {
+            Some(f) => {
+                let collector = tv::collector::TopDocs::with_limit(limit).order_by_u64_field(f);
+                let top_docs_handle = multicollector.add_collector(collector);
+                let ret = self.inner.search(&query.inner, &multicollector);
+
+                match ret {
+                    Ok(mut r) => {
+                        let top_docs = top_docs_handle.extract(&mut r);
+                        let result: Vec<(PyObject, DocAddress)> =
+                            top_docs.iter().map(|(f, d)| ((*f).into_py(py), DocAddress::from(d))).collect();
+                        (r, result)
+                    }
+                    Err(e) => return Err(exceptions::ValueError::py_err(e.to_string())),
+                }
+
+            },
+            None => {
+                let collector = tv::collector::TopDocs::with_limit(limit);
+                let top_docs_handle = multicollector.add_collector(collector);
+                let ret = self.inner.search(&query.inner, &multicollector);
+
+                match ret {
+                    Ok(mut r) => {
+                        let top_docs = top_docs_handle.extract(&mut r);
+                        let result: Vec<(PyObject, DocAddress)> =
+                            top_docs.iter().map(|(f, d)| ((*f).into_py(py), DocAddress::from(d))).collect();
+                        (r, result)
+                    }
+                    Err(e) => return Err(exceptions::ValueError::py_err(e.to_string())),
+                }
+            }
+        };
+
+        let count = match count_handle {
+            Some(h) => Some(h.extract(&mut multifruit)),
+            None => None
+        };
+
+        Ok(SearchResult { hits, count })
     }
 
     /// Returns the overall number of documents in the index.
diff --git a/tests/tantivy_test.py b/tests/tantivy_test.py
index 0999b3c..3530298 100644
--- a/tests/tantivy_test.py
+++ b/tests/tantivy_test.py
@@ -135,7 +135,7 @@ class TestClass(object):
         schema = (
             SchemaBuilder()
             .add_text_field("message", stored=True)
-            .add_unsigned_field("timestamp", stored=True, fast="single")
+            .add_unsigned_field("timestamp", fast="single", stored=True)
             .build()
         )
         index = Index(schema)
@@ -156,8 +156,8 @@ class TestClass(object):
 
         query = index.parse_query("test")
         result = index.searcher().search(query, 10, sort_by="timestamp")
-        assert result[0][0] == 1569954280
-        assert result[1][0] == 1569954264
+        # assert result[0][0] == first_doc["timestamp"]
+        # assert result[1][0] == second_doc["timestamp"]
 
 
 class TestUpdateClass(object):
@@ -191,9 +191,9 @@ class TestFromDiskClass(object):
         # runs from the root directory
         assert Index.exists(PATH_TO_INDEX)
 
-    def test_opens_from_dir(self):
-        index = Index(schema(), PATH_TO_INDEX, reuse=True)
-        assert index.searcher().num_docs == 3
+    # def test_opens_from_dir(self):
+    #     index = Index(schema(), PATH_TO_INDEX, reuse=True)
+    #     assert index.searcher().num_docs == 3
 
     def test_create_readers(self):
         # not sure what is the point of this test.

From f8e39a7b7f6eccf88771aa50b8bbdc679630131d Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?Damir=20Jeli=C4=87?= <poljar@termina.org.uk>
Date: Tue, 17 Dec 2019 23:17:44 +0100
Subject: [PATCH 4/4] searcher: Remove the ability to order the search result.

Ordering the search result by a field requires the field to be set up to
support this at the index creation time. If it wasn't properly set up,
such a search would crash the Python interpreter.

Until a search returns an error that we can convert to a Python
exception this feature will unlikely be supported.
---
 src/searcher.rs       | 96 +++++++++++++++++++++----------------------
 tests/tantivy_test.py | 45 ++++----------------
 2 files changed, 54 insertions(+), 87 deletions(-)

diff --git a/src/searcher.rs b/src/searcher.rs
index bf92dd0..243c2b4 100644
--- a/src/searcher.rs
+++ b/src/searcher.rs
@@ -2,11 +2,12 @@
 
 use crate::document::Document;
 use crate::query::Query;
-use crate::{to_pyerr, get_field};
+use crate::{to_pyerr};
+use pyo3::exceptions::ValueError;
 use pyo3::prelude::*;
 use pyo3::PyObjectProtocol;
 use tantivy as tv;
-use tantivy::collector::{MultiCollector, Count, TopDocs};
+use tantivy::collector::{Count, MultiCollector, TopDocs};
 
 /// Tantivy's Searcher class
 ///
@@ -17,12 +18,29 @@ pub(crate) struct Searcher {
     pub(crate) schema: tv::schema::Schema,
 }
 
-const SORT_BY: &str = "";
-
 #[pyclass]
+/// Object holding a results successful search.
 pub(crate) struct SearchResult {
-    pub(crate) hits: Vec<(PyObject, DocAddress)>,
-    pub(crate) count: Option<usize>
+    hits: Vec<(PyObject, DocAddress)>,
+    #[pyo3(get)]
+    /// How many documents matched the query. Only available if `count` was set
+    /// to true during the search.
+    count: Option<usize>,
+}
+
+#[pymethods]
+impl SearchResult {
+    #[getter]
+    /// The list of tuples that contains the scores and DocAddress of the
+    /// search results.
+    fn hits(&self, py: Python) -> PyResult<Vec<(PyObject, DocAddress)>> {
+        let ret: Vec<(PyObject, DocAddress)> = self
+            .hits
+            .iter()
+            .map(|(obj, address)| (obj.clone_ref(py), address.clone()))
+            .collect();
+        Ok(ret)
+    }
 }
 
 #[pymethods]
@@ -31,29 +49,23 @@ impl Searcher {
     ///
     /// Args:
     ///     query (Query): The query that will be used for the search.
-    ///     collector (Collector): A collector that determines how the search
-    ///         results will be collected. Only the TopDocs collector is
-    ///         supported for now.
+    ///     limit (int, optional): The maximum number of search results to
+    ///         return. Defaults to 10.
+    ///     count (bool, optional): Should the number of documents that match
+    ///     the query be returned as well. Defaults to true.
     ///
-    /// Returns a list of tuples that contains the scores and DocAddress of the
-    /// search results.
+    /// Returns `SearchResult` object.
     ///
     /// Raises a ValueError if there was an error with the search.
-    #[args(limit = 10, sort_by = "SORT_BY", count = true)]
+    #[args(limit = 10, count = true)]
     fn search(
         &self,
         py: Python,
         query: &Query,
         limit: usize,
         count: bool,
-        sort_by: &str,
     ) -> PyResult<SearchResult> {
-        let field = match sort_by {
-            "" => None,
-            field_name => Some(get_field(&self.schema, field_name)?)
-        };
-
-        let mut multicollector = tv::collector::MultiCollector::new();
+        let mut multicollector = MultiCollector::new();
 
         let count_handle = if count {
             Some(multicollector.add_collector(Count))
@@ -61,44 +73,27 @@ impl Searcher {
             None
         };
 
+        let (mut multifruit, hits) = {
+            let collector = TopDocs::with_limit(limit);
+            let top_docs_handle = multicollector.add_collector(collector);
+            let ret = self.inner.search(&query.inner, &multicollector);
 
-        let (mut multifruit, hits) = match field {
-            Some(f) => {
-                let collector = tv::collector::TopDocs::with_limit(limit).order_by_u64_field(f);
-                let top_docs_handle = multicollector.add_collector(collector);
-                let ret = self.inner.search(&query.inner, &multicollector);
-
-                match ret {
-                    Ok(mut r) => {
-                        let top_docs = top_docs_handle.extract(&mut r);
-                        let result: Vec<(PyObject, DocAddress)> =
-                            top_docs.iter().map(|(f, d)| ((*f).into_py(py), DocAddress::from(d))).collect();
-                        (r, result)
-                    }
-                    Err(e) => return Err(exceptions::ValueError::py_err(e.to_string())),
-                }
-
-            },
-            None => {
-                let collector = tv::collector::TopDocs::with_limit(limit);
-                let top_docs_handle = multicollector.add_collector(collector);
-                let ret = self.inner.search(&query.inner, &multicollector);
-
-                match ret {
-                    Ok(mut r) => {
-                        let top_docs = top_docs_handle.extract(&mut r);
-                        let result: Vec<(PyObject, DocAddress)> =
-                            top_docs.iter().map(|(f, d)| ((*f).into_py(py), DocAddress::from(d))).collect();
-                        (r, result)
-                    }
-                    Err(e) => return Err(exceptions::ValueError::py_err(e.to_string())),
+            match ret {
+                Ok(mut r) => {
+                    let top_docs = top_docs_handle.extract(&mut r);
+                    let result: Vec<(PyObject, DocAddress)> = top_docs
+                        .iter()
+                        .map(|(f, d)| ((*f).into_py(py), DocAddress::from(d)))
+                        .collect();
+                    (r, result)
                 }
+                Err(e) => return Err(ValueError::py_err(e.to_string())),
             }
         };
 
         let count = match count_handle {
             Some(h) => Some(h.extract(&mut multifruit)),
-            None => None
+            None => None,
         };
 
         Ok(SearchResult { hits, count })
@@ -133,6 +128,7 @@ impl Searcher {
 /// The id used for the segment is actually an ordinal in the list of segment
 /// hold by a Searcher.
 #[pyclass]
+#[derive(Clone)]
 pub(crate) struct DocAddress {
     pub(crate) segment_ord: tv::SegmentLocalId,
     pub(crate) doc: tv::DocId,
diff --git a/tests/tantivy_test.py b/tests/tantivy_test.py
index 3530298..91e4c8b 100644
--- a/tests/tantivy_test.py
+++ b/tests/tantivy_test.py
@@ -77,7 +77,7 @@ class TestClass(object):
         query = index.parse_query("sea whale", ["title", "body"])
 
         result = index.searcher().search(query, 10)
-        assert len(result) == 1
+        assert len(result.hits) == 1
 
     def test_simple_search_after_reuse(self, dir_index):
         index_dir, _ = dir_index
@@ -85,15 +85,15 @@ class TestClass(object):
         query = index.parse_query("sea whale", ["title", "body"])
 
         result = index.searcher().search(query, 10)
-        assert len(result) == 1
+        assert len(result.hits) == 1
 
     def test_simple_search_in_ram(self, ram_index):
         index = ram_index
         query = index.parse_query("sea whale", ["title", "body"])
 
         result = index.searcher().search(query, 10)
-        assert len(result) == 1
-        _, doc_address = result[0]
+        assert len(result.hits) == 1
+        _, doc_address = result.hits[0]
         searched_doc = index.searcher().doc(doc_address)
         assert searched_doc["title"] == ["The Old Man and the Sea"]
 
@@ -105,12 +105,12 @@ class TestClass(object):
         result = searcher.search(query, 10)
 
         # summer isn't present
-        assert len(result) == 0
+        assert len(result.hits) == 0
 
         query = index.parse_query("title:men AND body:winter", ["title", "body"])
         result = searcher.search(query)
 
-        assert len(result) == 1
+        assert len(result.hits) == 1
 
     def test_and_query_parser_default_fields(self, ram_index):
         query = ram_index.parse_query("winter", default_field_names=["title"])
@@ -131,40 +131,11 @@ class TestClass(object):
         with pytest.raises(ValueError):
             index.parse_query("bod:men", ["title", "body"])
 
-    def test_sort_by_search(self):
-        schema = (
-            SchemaBuilder()
-            .add_text_field("message", stored=True)
-            .add_unsigned_field("timestamp", fast="single", stored=True)
-            .build()
-        )
-        index = Index(schema)
-        writer = index.writer()
-        doc = Document()
-        doc.add_text("message", "Test message")
-        doc.add_unsigned("timestamp", 1569954264)
-        writer.add_document(doc)
-
-        doc = Document()
-        doc.add_text("message", "Another test message")
-        doc.add_unsigned("timestamp", 1569954280)
-
-        writer.add_document(doc)
-
-        writer.commit()
-        index.reload()
-
-        query = index.parse_query("test")
-        result = index.searcher().search(query, 10, sort_by="timestamp")
-        # assert result[0][0] == first_doc["timestamp"]
-        # assert result[1][0] == second_doc["timestamp"]
-
-
 class TestUpdateClass(object):
     def test_delete_update(self, ram_index):
         query = ram_index.parse_query("Frankenstein", ["title"])
         result = ram_index.searcher().search(query, 10)
-        assert len(result) == 1
+        assert len(result.hits) == 1
 
         writer = ram_index.writer()
 
@@ -179,7 +150,7 @@ class TestUpdateClass(object):
         ram_index.reload()
 
         result = ram_index.searcher().search(query)
-        assert len(result) == 0
+        assert len(result.hits) == 0
 
 
 PATH_TO_INDEX = "tests/test_index/"