readthedocs · ericholscher · Dec 7, 2017 · Dec 7, 2017 · Dec 7, 2017 · Dec 7, 2017
diff --git a/readthedocs/core/management/commands/reindex_elasticsearch.py b/readthedocs/core/management/commands/reindex_elasticsearch.py
@@ -29,15 +29,15 @@ def handle(self, *args, **options):
         """Build/index all versions or a single project's version"""
         project = options['project']
 
-        queryset = Version.objects.all()
+        queryset = Version.objects.filter(active=True)
 
         if project:
             queryset = queryset.filter(project__slug=project)
             if not queryset.exists():
                 raise CommandError(
                     'No project with slug: {slug}'.format(slug=project))
             log.info("Building all versions for %s", project)
-        elif getattr(settings, 'INDEX_ONLY_LATEST', True):
+        if getattr(settings, 'INDEX_ONLY_LATEST', True):
             queryset = queryset.filter(slug=LATEST)
 
         for version in queryset:

diff --git a/readthedocs/restapi/urls.py b/readthedocs/restapi/urls.py
@@ -47,7 +47,7 @@
     url(r'index_search/',
         search_views.index_search,
         name='index_search'),
-    url(r'search/$', views.search_views.search, name='api_search'),
+    url(r'^search/$', views.search_views.search, name='api_search'),
     url(r'search/project/$',
         search_views.project_search,
         name='api_project_search'),

diff --git a/readthedocs/restapi/utils.py b/readthedocs/restapi/utils.py
@@ -141,11 +141,10 @@ def index_search_request(version, page_list, commit, project_scale, page_scale,
                     'weight': page_scale,
                 })
             for route in routes:
-                section_obj.bulk_index(section_index_list, parent=page_id,
-                                       routing=route)
+                section_obj.bulk_index(section_index_list, routing=route)
 
     for route in routes:
-        page_obj.bulk_index(index_list, parent=project.slug, routing=route)
+        page_obj.bulk_index(index_list, routing=route)
 
     if delete:
         log.info("Deleting files not in commit: %s", commit)

diff --git a/readthedocs/restapi/views/footer_views.py b/readthedocs/restapi/views/footer_views.py
@@ -43,7 +43,7 @@ def get_version_compare_data(project, base_version=None):
     }
     if highest_version_obj:
         ret_val['url'] = highest_version_obj.get_absolute_url()
-        ret_val['slug'] = highest_version_obj.slug,
+        ret_val['slug'] = highest_version_obj.slug
     if base_version and base_version.slug != LATEST:
         try:
             base_version_comparable = parse_version_failsafe(

diff --git a/readthedocs/search/indexes.py b/readthedocs/search/indexes.py
@@ -19,7 +19,7 @@
 import datetime
 
 from elasticsearch import Elasticsearch, exceptions
-from elasticsearch.helpers import bulk_index
+from elasticsearch.helpers import bulk
 
 from django.conf import settings
 
@@ -48,8 +48,6 @@ def get_settings(self, settings_override=None):
             'number_of_replicas': settings.ES_DEFAULT_NUM_REPLICAS,
             'number_of_shards': settings.ES_DEFAULT_NUM_SHARDS,
             'refresh_interval': '5s',
-            'store.compress.tv': True,
-            'store.compress.stored': True,
             'analysis': self.get_analysis(),
         }
         if settings_override:
@@ -139,7 +137,7 @@ def bulk_index(self, data, index=None, chunk_size=500, parent=None,
             docs.append(doc)
 
         # TODO: This doesn't work with the new ES setup.
-        bulk_index(self.es, docs, chunk_size=chunk_size)
+        bulk(self.es, docs, chunk_size=chunk_size)
 
     def index_document(self, data, index=None, parent=None, routing=None):
         doc = self.extract_document(data)
@@ -220,25 +218,24 @@ def get_mapping(self):
                 # Disable _all field to reduce index size.
                 '_all': {'enabled': False},
                 'properties': {
-                    'id': {'type': 'long'},
-                    'name': {'type': 'string', 'analyzer': 'default_icu'},
-                    'description': {'type': 'string', 'analyzer': 'default_icu'},
-
-                    'slug': {'type': 'string', 'index': 'not_analyzed'},
-                    'lang': {'type': 'string', 'index': 'not_analyzed'},
-                    'tags': {'type': 'string', 'index': 'not_analyzed'},
-                    'privacy': {'type': 'string', 'index': 'not_analyzed'},
+                    'id': {'type': 'keyword'},
+                    'name': {'type': 'text', 'analyzer': 'default_icu'},
+                    'description': {'type': 'text', 'analyzer': 'default_icu'},
+
+                    'slug': {'type': 'keyword'},
+                    'lang': {'type': 'keyword'},
+                    'tags': {'type': 'keyword'},
+                    'privacy': {'type': 'keyword'},
                     'author': {
-                        'type': 'string',
+                        'type': 'text',
                         'analyzer': 'default_icu',
                         'fields': {
                             'raw': {
-                                'type': 'string',
-                                'index': 'not_analyzed',
+                                'type': 'keyword',
                             },
                         },
                     },
-                    'url': {'type': 'string', 'index': 'not_analyzed'},
+                    'url': {'type': 'keyword'},
                     # Add a weight field to enhance relevancy scoring.
                     'weight': {'type': 'float'},
                 }
@@ -273,19 +270,19 @@ def get_mapping(self):
                 # Disable _all field to reduce index size.
                 '_all': {'enabled': False},
                 # Associate a page with a project.
-                '_parent': {'type': self._parent},
+                # Disabled (TODO confirm removal): '_parent': {'type': self._parent},
                 'properties': {
-                    'id': {'type': 'string', 'index': 'not_analyzed'},
-                    'sha': {'type': 'string', 'index': 'not_analyzed'},
-                    'project': {'type': 'string', 'index': 'not_analyzed'},
-                    'version': {'type': 'string', 'index': 'not_analyzed'},
-                    'path': {'type': 'string', 'index': 'not_analyzed'},
-                    'taxonomy': {'type': 'string', 'index': 'not_analyzed'},
-                    'commit': {'type': 'string', 'index': 'not_analyzed'},
-
-                    'title': {'type': 'string', 'analyzer': 'default_icu'},
-                    'headers': {'type': 'string', 'analyzer': 'default_icu'},
-                    'content': {'type': 'string', 'analyzer': 'default_icu'},
+                    'id': {'type': 'keyword'},
+                    'sha': {'type': 'keyword'},
+                    'project': {'type': 'keyword'},
+                    'version': {'type': 'keyword'},
+                    'path': {'type': 'keyword'},
+                    'taxonomy': {'type': 'keyword'},
+                    'commit': {'type': 'keyword'},
+
+                    'title': {'type': 'text', 'analyzer': 'default_icu'},
+                    'headers': {'type': 'text', 'analyzer': 'default_icu'},
+                    'content': {'type': 'text', 'analyzer': 'default_icu'},
                     # Add a weight field to enhance relevancy scoring.
                     'weight': {'type': 'float'},
                 }
@@ -321,7 +318,7 @@ def get_mapping(self):
                 # Disable _all field to reduce index size.
                 '_all': {'enabled': False},
                 # Associate a section with a page.
-                '_parent': {'type': self._parent},
+                # Disabled (TODO confirm removal): '_parent': {'type': self._parent},
                 # Commenting this out until we need it.
                 # 'suggest': {
                 #     "type": "completion",
@@ -330,18 +327,18 @@ def get_mapping(self):
                 #     "payloads": True,
                 # },
                 'properties': {
-                    'id': {'type': 'string', 'index': 'not_analyzed'},
-                    'project': {'type': 'string', 'index': 'not_analyzed'},
-                    'version': {'type': 'string', 'index': 'not_analyzed'},
-                    'path': {'type': 'string', 'index': 'not_analyzed'},
-                    'page_id': {'type': 'string', 'index': 'not_analyzed'},
-                    'commit': {'type': 'string', 'index': 'not_analyzed'},
-                    'title': {'type': 'string', 'analyzer': 'default_icu'},
-                    'content': {'type': 'string', 'analyzer': 'default_icu'},
+                    'id': {'type': 'keyword'},
+                    'project': {'type': 'keyword'},
+                    'version': {'type': 'keyword'},
+                    'path': {'type': 'keyword'},
+                    'page_id': {'type': 'keyword'},
+                    'commit': {'type': 'keyword'},
+                    'title': {'type': 'text', 'analyzer': 'default_icu'},
+                    'content': {'type': 'text', 'analyzer': 'default_icu'},
                     'blocks': {
                         'type': 'object',
                         'properties': {
-                            'code': {'type': 'string', 'analyzer': 'default_icu'}
+                            'code': {'type': 'text', 'analyzer': 'default_icu'}
                         }
                     },
                     # Add a weight field to enhance relevancy scoring.

diff --git a/readthedocs/settings/base.py b/readthedocs/settings/base.py
@@ -116,6 +116,7 @@ def INSTALLED_APPS(self):  # noqa
         if donate:
             apps.append('django_countries')
             apps.append('readthedocsext.donate')
+            apps.append('readthedocsext.search')
         return apps
 
     TEMPLATE_LOADERS = (

diff --git a/readthedocs/urls.py b/readthedocs/urls.py
@@ -86,9 +86,13 @@
 
 if 'readthedocsext.donate' in settings.INSTALLED_APPS:
     # Include donation URL's
-    groups.append([
-        url(r'^sustainability/', include('readthedocsext.donate.urls')),
-    ])
+    groups.insert(0,
+                  [url(r'^sustainability/', include('readthedocsext.donate.urls'))]
+                  )
+    for num, _url in enumerate(rtd_urls):
+        if _url and hasattr(_url, 'name') and _url.name == 'search':
+            rtd_urls[num] = \
+                url(r'^search/', 'readthedocsext.search.mainsearch.elastic_search', name='search')
 if not getattr(settings, 'USE_SUBDOMAIN', False) or settings.DEBUG:
     groups.insert(0, docs_urls)
 if getattr(settings, 'ALLOW_ADMIN', True):

diff --git a/requirements/pip.txt b/requirements/pip.txt
@@ -36,8 +36,7 @@ dnspython==1.15.0
 httplib2==0.7.7
 
 # Search
-elasticsearch==1.5.0
-pyelasticsearch==0.7.1
+elasticsearch==5.5.1
 pyquery==1.2.2
 
 # Utils