浏览代码

Use a separate page size for testing

Daoud Clarke 4 年之前
父节点
当前提交
c84eeba92e
共有 1 个文件被更改，包括 7 次插入和 7 次删除
  1. 7 7
      performance.py

+ 7 - 7
performance.py

@@ -1,23 +1,23 @@
 """
 """
 Test the performance of the search in terms of compression and speed.
 Test the performance of the search in terms of compression and speed.
 """
 """
-import json
-import numpy as np
 import os
 import os
 from datetime import datetime
 from datetime import datetime
 from itertools import islice
 from itertools import islice
 
 
+import numpy as np
 from spacy.lang.en import English
 from spacy.lang.en import English
 from starlette.testclient import TestClient
 from starlette.testclient import TestClient
 
 
-from app import app, complete
-from index import TinyIndexer, index_titles_and_urls, PAGE_SIZE, NUM_PAGES
+from app import app
+from index import TinyIndexer, index_titles_and_urls
 from paths import TEST_INDEX_PATH
 from paths import TEST_INDEX_PATH
 from wiki import get_wiki_titles_and_urls
 from wiki import get_wiki_titles_and_urls
 
 
-
 NUM_DOCUMENTS = 30000
 NUM_DOCUMENTS = 30000
 NUM_PAGES_FOR_STATS = 10
 NUM_PAGES_FOR_STATS = 10
+TEST_PAGE_SIZE = 512
+TEST_NUM_PAGES = 32
 
 
 
 
 def query_test():
 def query_test():
@@ -43,7 +43,7 @@ def query_test():
 
 
 def page_stats(indexer: TinyIndexer):
 def page_stats(indexer: TinyIndexer):
     page_sizes = []
     page_sizes = []
-    for i in range(NUM_PAGES):
+    for i in range(TEST_NUM_PAGES):
         page = indexer.get_page(i)
         page = indexer.get_page(i)
         if page is not None:
         if page is not None:
             page_sizes.append(len(page))
             page_sizes.append(len(page))
@@ -57,7 +57,7 @@ def performance_test():
         os.remove(TEST_INDEX_PATH)
         os.remove(TEST_INDEX_PATH)
     except FileNotFoundError:
     except FileNotFoundError:
         print("No test index found, creating")
         print("No test index found, creating")
-    with TinyIndexer(TEST_INDEX_PATH, NUM_PAGES, PAGE_SIZE) as indexer:
+    with TinyIndexer(TEST_INDEX_PATH, TEST_NUM_PAGES, TEST_PAGE_SIZE) as indexer:
         titles_and_urls = get_wiki_titles_and_urls()
         titles_and_urls = get_wiki_titles_and_urls()
         titles_and_urls_slice = islice(titles_and_urls, NUM_DOCUMENTS)
         titles_and_urls_slice = islice(titles_and_urls, NUM_DOCUMENTS)