diff --git a/.dockerignore b/.dockerignore deleted file mode 100644 index 98f39e7be..000000000 --- a/.dockerignore +++ /dev/null @@ -1,4 +0,0 @@ -data -results -*.bvecs -venv diff --git a/.github/workflows/benchmarks.yml b/.github/workflows/benchmarks.yml index cdd86dd47..1302e3311 100644 --- a/.github/workflows/benchmarks.yml +++ b/.github/workflows/benchmarks.yml @@ -1,61 +1,61 @@ -# Contributed by @GuilhemN in https://github.com/erikbern/ann-benchmarks/pull/233 -name: Billion-Scale ANN Benchmarks - -on: [push, pull_request] - -jobs: - build: - runs-on: ubuntu-latest - strategy: - matrix: - include: - - algorithm: faiss-ivf - library: faissconda - dataset: random-xs - - algorithm: faiss-t1 - dataset: random-xs - library: faissconda - - algorithm: faiss-t1 - dataset: random-range-xs - library: faissconda - - algorithm: diskann-t2 - dataset: random-xs - library: diskann - - algorithm: diskann-t2 - dataset: random-range-xs - library: diskann - - algorithm: httpann_example - dataset: random-xs - library: httpann_example - - algorithm: httpann_example - dataset: random-range-xs - library: httpann_example - fail-fast: false - - steps: - - uses: actions/checkout@v2 # Pull the repository - - - name: Set up Python 3.6 - uses: actions/setup-python@v2 - with: - python-version: 3.6 - - - name: Install dependencies - run: | - pip install -r requirements.txt - python install.py - env: - LIBRARY: ${{ matrix.library }} - DATASET: ${{ matrix.dataset }} - - - name: Run the benchmark - run: | - python create_dataset.py --dataset $DATASET - python run.py --algorithm $ALGORITHM --max-n-algorithms 2 --dataset $DATASET --timeout 600 - sudo chmod -R 777 results/ - python plot.py --dataset $DATASET --output plot.png - python data_export.py --output test.csv - - env: - ALGORITHM: ${{ matrix.algorithm}} - DATASET: ${{ matrix.dataset }} +# Contributed by @GuilhemN in https://github.com/erikbern/ann-benchmarks/pull/233 +name: Billion-Scale ANN Benchmarks + +on: [push, pull_request] + +jobs: 
+ build: + runs-on: ubuntu-latest + strategy: + matrix: + include: + - algorithm: faiss-ivf + library: faissconda + dataset: random-xs + - algorithm: faiss-t1 + dataset: random-xs + library: faissconda + - algorithm: faiss-t1 + dataset: random-range-xs + library: faissconda + - algorithm: diskann-t2 + dataset: random-xs + library: diskann + - algorithm: diskann-t2 + dataset: random-range-xs + library: diskann + - algorithm: httpann_example + dataset: random-xs + library: httpann_example + - algorithm: httpann_example + dataset: random-range-xs + library: httpann_example + fail-fast: false + + steps: + - uses: actions/checkout@v2 # Pull the repository + + - name: Set up Python 3.6 + uses: actions/setup-python@v2 + with: + python-version: 3.6 + + - name: Install dependencies + run: | + pip install -r requirements.txt + python install.py + env: + LIBRARY: ${{ matrix.library }} + DATASET: ${{ matrix.dataset }} + + - name: Run the benchmark + run: | + python create_dataset.py --dataset $DATASET + python run.py --algorithm $ALGORITHM --max-n-algorithms 2 --dataset $DATASET --timeout 600 + sudo chmod -R 777 results/ + python plot.py --dataset $DATASET --output plot.png + python data_export.py --output test.csv + + env: + ALGORITHM: ${{ matrix.algorithm}} + DATASET: ${{ matrix.dataset }} diff --git a/GitHub_Logo_White.png b/GitHub_Logo_White.png new file mode 100644 index 000000000..c61ab9d05 Binary files /dev/null and b/GitHub_Logo_White.png differ diff --git a/LICENSE b/LICENSE deleted file mode 100644 index ef714baaa..000000000 --- a/LICENSE +++ /dev/null @@ -1,21 +0,0 @@ -MIT License - -Copyright (c) 2021 Martin Aumüller - -Permission is hereby granted, free of charge, to any person obtaining a copy -of this software and associated documentation files (the "Software"), to deal -in the Software without restriction, including without limitation the rights -to use, copy, modify, merge, publish, distribute, sublicense, and/or sell -copies of the Software, and to permit 
persons to whom the Software is -furnished to do so, subject to the following conditions: - -The above copyright notice and this permission notice shall be included in all -copies or substantial portions of the Software. - -THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR -IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, -FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE -AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER -LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, -OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE -SOFTWARE. diff --git a/MSFT-Turing-ANNS-terms.txt b/MSFT-Turing-ANNS-terms.txt deleted file mode 100644 index e413bfd7b..000000000 --- a/MSFT-Turing-ANNS-terms.txt +++ /dev/null @@ -1,21 +0,0 @@ -Release Terms for the Microsoft-Turing-ANNS dataset ---------------------------------------------------- - -The MS-Turing-ANNS datasets are intended for non-commercial research -purposes only to promote advancement in the field of artificial -intelligence and related areas, and is made available free of charge -without extending any license or other intellectual property -rights. The dataset is provided “as is” without warranty and usage of -the data has risks since we may not own the underlying rights in the -documents. We are not be liable for any damages related to use of the -dataset. Feedback is voluntarily given and can be used as we see -fit. Upon violation of any of these terms, your rights to use the -dataset will end automatically. - - -Disclaimer ----------- - -Data sets are intended for research and academic purposes. Please note -that inputs or outputs may include content that users find offensive, -shocking, and/or otherwise harmful. 
diff --git a/README.md b/README.md index 89754454b..e78c3ea52 100644 --- a/README.md +++ b/README.md @@ -1,77 +1,77 @@ -# Billion-Scale ANN - - - -## Install - -The only prerequisite is Python (tested with 3.6) and Docker. Works with newer versions of Python as well but probably requires an updated `requirements.txt` on the host. (Suggestion: copy `requirements.txt` to `requirements${PYTHON_VERSION}.txt` and remove all fixed versions. `requirements.txt` has to be kept for the docker containers.) - -1. Clone the repo. -2. Run `pip install -r requirements.txt` (Use `requirements_py38.txt` if you have Python 3.8.) -3. Install docker by following instructions [here](https://docs.docker.com/engine/install/ubuntu/). -You might also want to follow the post-install steps for running docker in non-root user mode. -3. Run `python install.py` to build all the libraries inside Docker containers. - -## Storing Data - -The framework assumes that all data is stored in `data/`. -Please use a symlink if your datasets and indices are supposed to be stored somewhere else. -The location of the linked folder matters a great deal for SSD-based search performance in T2. -A local SSD such as the one found on Azure Ls-series VMs is better than remote disks, even premium ones. -See [T1/T2](t1_t2/README.md) for more details. - -## Data sets - -See for details on the different datasets. - -### Dataset Preparation - -Before running experiments, datasets have to be downloaded. All preparation can be carried out by calling - -```python -python create_dataset.py --dataset [bigann-1B | deep-1B | text2image-1B | ssnpp-1B | msturing-1B | msspacev-1B] -``` - -Note that downloading the datasets can potentially take many hours. - -For local testing, there exist smaller random datasets `random-xs` and `random-range-xs`. -Furthermore, most datasets have 1M, 10M and 100M versions, run `python create_dataset -h` to get an overview. 
- - -## Running the benchmark - -Run `python run.py --dataset $DS --algorithm $ALGO` where `DS` is the dataset you are running on, -and `ALGO` is the name of the algorithm. (Use `python run.py --list-algorithms`) to get an overview. -`python run.py -h` provides you with further options. - -The parameters used by the implementation to build and query the index can be found in `algos.yaml`. - -## Running the track 1 baseline -After running the installation, we can evaluate the baseline as follows. - -```bash - -for DS in bigann-1B deep-1B text2image-1B ssnpp-1B msturing-1B msspacev-1B; -do - python run.py --dataset $DS --algorithm faiss-t1; -done -``` - -On a 28-core Xeon E5-2690 v4 that provided 100MB/s downloads, carrying out the baseline experiments took roughly 7 days. - -To evaluate the results, run -```bash -sudo chmod -R 777 results/ -python data_export.py --output res.csv -python3.8 eval/show_operating_points.py --algorithm faiss-t1 --threshold 10000 -``` - -## Including your algorithm and Evaluating the Results - -See [Track T1/T2](t1_t2/README.md) for more details on evaluation for Tracks T1 and T2. - -See [Track T3](t3/README.md) for more details on evaluation for Track T3. - -# Credits - -This project is a version of [ann-benchmarks](https://github.com/erikbern/ann-benchmarks) by [Erik Bernhardsson](https://erikbern.com/) and contributors targetting billion-scale datasets. +# Billion-Scale ANN + + + +## Install + +The only prerequisite is Python (tested with 3.6) and Docker. Works with newer versions of Python as well but probably requires an updated `requirements.txt` on the host. (Suggestion: copy `requirements.txt` to `requirements${PYTHON_VERSION}.txt` and remove all fixed versions. `requirements.txt` has to be kept for the docker containers.) + +1. Clone the repo. +2. Run `pip install -r requirements.txt` (Use `requirements_py38.txt` if you have Python 3.8.) +3. 
Install docker by following instructions [here](https://docs.docker.com/engine/install/ubuntu/). +You might also want to follow the post-install steps for running docker in non-root user mode. +3. Run `python install.py` to build all the libraries inside Docker containers. + +## Storing Data + +The framework assumes that all data is stored in `data/`. +Please use a symlink if your datasets and indices are supposed to be stored somewhere else. +The location of the linked folder matters a great deal for SSD-based search performance in T2. +A local SSD such as the one found on Azure Ls-series VMs is better than remote disks, even premium ones. +See [T1/T2](t1_t2/README.md) for more details. + +## Data sets + +See for details on the different datasets. + +### Dataset Preparation + +Before running experiments, datasets have to be downloaded. All preparation can be carried out by calling + +```python +python create_dataset.py --dataset [bigann-1B | deep-1B | text2image-1B | ssnpp-1B | msturing-1B | msspacev-1B] +``` + +Note that downloading the datasets can potentially take many hours. + +For local testing, there exist smaller random datasets `random-xs` and `random-range-xs`. +Furthermore, most datasets have 1M, 10M and 100M versions, run `python create_dataset -h` to get an overview. + + +## Running the benchmark + +Run `python run.py --dataset $DS --algorithm $ALGO` where `DS` is the dataset you are running on, +and `ALGO` is the name of the algorithm. (Use `python run.py --list-algorithms`) to get an overview. +`python run.py -h` provides you with further options. + +The parameters used by the implementation to build and query the index can be found in `algos.yaml`. + +## Running the track 1 baseline +After running the installation, we can evaluate the baseline as follows. 
+ +```bash + +for DS in bigann-1B deep-1B text2image-1B ssnpp-1B msturing-1B msspacev-1B; +do + python run.py --dataset $DS --algorithm faiss-t1; +done +``` + +On a 28-core Xeon E5-2690 v4 that provided 100MB/s downloads, carrying out the baseline experiments took roughly 7 days. + +To evaluate the results, run +```bash +sudo chmod -R 777 results/ +python data_export.py --output res.csv +python3.8 eval/show_operating_points.py --algorithm faiss-t1 --threshold 10000 +``` + +## Including your algorithm and Evaluating the Results + +See [Track T1/T2](t1_t2/README.md) for more details on evaluation for Tracks T1 and T2. + +See [Track T3](t3/README.md) for more details on evaluation for Track T3. + +# Credits + +This project is a version of [ann-benchmarks](https://github.com/erikbern/ann-benchmarks) by [Erik Bernhardsson](https://erikbern.com/) and contributors targetting billion-scale datasets. diff --git a/algos.yaml b/algos.yaml deleted file mode 100644 index 47126a73f..000000000 --- a/algos.yaml +++ /dev/null @@ -1,594 +0,0 @@ -any: - faiss-ivf: - docker-tag: billion-scale-benchmark-faissconda - module: benchmark.algorithms.faiss_inmem - constructor: FaissIVF - base-args: ["@metric"] - run-groups: - base: - args: [[1024,2048,4096,8192]] - query-args: [[1, 5, 10, 50, 100, 200]] -random-range-xs: - faiss-t1: - docker-tag: billion-scale-benchmark-faissconda - module: benchmark.algorithms.faiss_t1 - constructor: Faiss - base-args: ["@metric"] - run-groups: - base: - # the following args show all build arguments that can be provided to the t1 baseline. 
- args: | - [{"indexkey": "OPQ32_128,IVF1024_HNSW32,PQ32", - "buildthreads": -1, - "by_residual": -1, - "add_bs": 100000000, - "two_level_clustering": true, - "quantizer_add_efSearch": 80, - "quantizer_efConstruction": 200, - "maxtrain": 100000000, - "clustering_niter": 25 - }] - query-args: | - ["nprobe=1,quantizer_efSearch=4", - "nprobe=2,quantizer_efSearch=4", - "nprobe=2,quantizer_efSearch=8", - "nprobe=4,quantizer_efSearch=4", - "nprobe=2,quantizer_efSearch=16"] - diskann-t2: - docker-tag: billion-scale-benchmark-diskann - module: benchmark.algorithms.diskann-t2 - constructor: Diskann - base-args: ["@metric"] - run-groups: - base: - args: | - [{"R":32, "L":32, "B":0.0001, "M":1}] - query-args: | - [{"Lmin":3, "Lmax":100, "BW":4, "T":16}] - diskann-v0_3-t2: - docker-tag: billion-scale-benchmark-diskann - module: benchmark.algorithms.diskann-v0_3 - constructor: Diskann - base-args: ["@metric"] - run-groups: - base: - args: | - [{"R":32, "L":32, "B":0.0001, "M":1}] - query-args: | - [{"Lmin":3, "Lmax":100, "BW":4, "T":16}] - httpann_example: - docker-tag: billion-scale-benchmark-httpann_example - module: benchmark.algorithms.httpann_example - constructor: HttpANNExampleAlgorithm - base-args: [ "@metric", "@dimension" ] - run-groups: - base: - args: - - [ 0.2, 0.4, 1.0 ] - query-args: [] -random-xs: - faiss-t1: - docker-tag: billion-scale-benchmark-faissconda - module: benchmark.algorithms.faiss_t1 - constructor: Faiss - base-args: ["@metric"] - run-groups: - base: - args: | - [{"indexkey": "OPQ32_128,IVF1024_HNSW32,PQ32" - }] - query-args: | - ["nprobe=1,quantizer_efSearch=4", - "nprobe=2,quantizer_efSearch=4", - "nprobe=2,quantizer_efSearch=8", - "nprobe=4,quantizer_efSearch=4", - "nprobe=2,quantizer_efSearch=16"] - diskann-t2: - docker-tag: billion-scale-benchmark-diskann - module: benchmark.algorithms.diskann-t2 - constructor: Diskann - base-args: ["@metric"] - run-groups: - base: - args: | - [{"R":32, "L":32, "B":0.0001, "M":1}] - query-args: | - [{"Ls":10, 
"BW":4, "T":16}] - diskann-v0_3-t2: - docker-tag: billion-scale-benchmark-diskann - module: benchmark.algorithms.diskann-v0_3 - constructor: Diskann - base-args: ["@metric"] - run-groups: - base: - args: | - [{"R":32, "L":32, "B":0.0001, "M":1}] - query-args: | - [{"Ls":10, "BW":4, "T":16}] - httpann_example: - docker-tag: billion-scale-benchmark-httpann_example - module: benchmark.algorithms.httpann_example - constructor: HttpANNExampleAlgorithm - base-args: [ "@metric", "@dimension" ] - run-groups: - base: - args: - - [ 0.2, 0.8, 1.0 ] - query-args: [ ] -deep-10M: - faiss-t1: - docker-tag: billion-scale-benchmark-faissconda - module: benchmark.algorithms.faiss_t1 - constructor: Faiss - base-args: ["@metric"] - run-groups: - base: - args: | - [{"indexkey": "OPQ32_128,IVF65536_HNSW32,PQ32" - }] - query-args: | - ["nprobe=1,quantizer_efSearch=4", - "nprobe=2,quantizer_efSearch=4", - "nprobe=2,quantizer_efSearch=8", - "nprobe=4,quantizer_efSearch=4", - "nprobe=2,quantizer_efSearch=16"] - diskann-t2: - docker-tag: billion-scale-benchmark-diskann - module: benchmark.algorithms.diskann-t2 - constructor: Diskann - base-args: ["@metric"] - run-groups: - base: - args: | - [{"R":100, "L":100, "B":0.3, "M":15}] - query-args: | - [{"Ls":50, "BW":4, "T":16}] -deep-1B: - faiss-t1: - docker-tag: billion-scale-benchmark-faissconda - module: benchmark.algorithms.faiss_t1 - constructor: Faiss - base-args: ["@metric"] - run-groups: - base: - args: | - [{"indexkey": "OPQ64_128,IVF1048576_HNSW32,PQ64x4fsr", - "url": "https://dl.fbaipublicfiles.com/billion-scale-ann-benchmarks/track1_baseline_faiss/deep-1B.IVF1M_2level_PQ64x4fsr.faissindex" - }] - query-args: | - ["nprobe=1,quantizer_efSearch=4", - "nprobe=2,quantizer_efSearch=4", - "nprobe=2,quantizer_efSearch=8", - "nprobe=4,quantizer_efSearch=4", - "nprobe=2,quantizer_efSearch=16", - "nprobe=4,quantizer_efSearch=8", - "nprobe=4,quantizer_efSearch=16", - "nprobe=8,quantizer_efSearch=4", - "nprobe=8,quantizer_efSearch=8", - 
"nprobe=8,quantizer_efSearch=16", - "nprobe=8,quantizer_efSearch=32", - "nprobe=8,quantizer_efSearch=64", - "nprobe=16,quantizer_efSearch=8", - "nprobe=16,quantizer_efSearch=16", - "nprobe=16,quantizer_efSearch=32", - "nprobe=16,quantizer_efSearch=64", - "nprobe=16,quantizer_efSearch=128", - "nprobe=32,quantizer_efSearch=16", - "nprobe=32,quantizer_efSearch=32", - "nprobe=32,quantizer_efSearch=64", - "nprobe=32,quantizer_efSearch=128", - "nprobe=32,quantizer_efSearch=256", - "nprobe=64,quantizer_efSearch=16", - "nprobe=64,quantizer_efSearch=32", - "nprobe=64,quantizer_efSearch=64", - "nprobe=64,quantizer_efSearch=128", - "nprobe=64,quantizer_efSearch=256", - "nprobe=64,quantizer_efSearch=512", - "nprobe=128,quantizer_efSearch=32", - "nprobe=128,quantizer_efSearch=64", - "nprobe=128,quantizer_efSearch=128", - "nprobe=128,quantizer_efSearch=256", - "nprobe=128,quantizer_efSearch=512", - "nprobe=256,quantizer_efSearch=64", - "nprobe=256,quantizer_efSearch=128"] - diskann-t2: - docker-tag: billion-scale-benchmark-diskann - module: benchmark.algorithms.diskann-t2 - constructor: Diskann - base-args: ["@metric"] - run-groups: - base: - args: | - [{"R":100, "L":100, "B":50, "M":110, - "url": "https://comp21storage.blob.core.windows.net/publiccontainer/comp21/diskann-T2-baseline-indices/deep-1B/R100_L100_B50_M110" - }] - query-args: | - [{"Ls":30, "BW":4, "T":16}, - {"Ls":40, "BW":4, "T":16}, - {"Ls":50, "BW":4, "T":16}, - {"Ls":53, "BW":4, "T":16}, - {"Ls":56, "BW":4, "T":16}, - {"Ls":58, "BW":4, "T":16}, - {"Ls":60, "BW":4, "T":16}, - {"Ls":70, "BW":4, "T":16}, - {"Ls":80, "BW":4, "T":16}, - {"Ls":100, "BW":4, "T":16}] -msspacev-1B: - faiss-t1: - docker-tag: billion-scale-benchmark-faissconda - module: benchmark.algorithms.faiss_t1 - constructor: Faiss - base-args: ["@metric"] - run-groups: - base: - args: | - [{"indexkey": "OPQ64_128,IVF1048576_HNSW32,PQ64x4fsr", - "url": 
"https://dl.fbaipublicfiles.com/billion-scale-ann-benchmarks/track1_baseline_faiss/msspacev-1B.IVF1M_2level_PQ64x4fsr.faissindex", - "query_bs": 4096 - }] - query-args: | - ["nprobe=1,quantizer_efSearch=4", - "nprobe=1,quantizer_efSearch=8", - "nprobe=1,quantizer_efSearch=16", - "nprobe=2,quantizer_efSearch=8", - "nprobe=2,quantizer_efSearch=16", - "nprobe=4,quantizer_efSearch=16", - "nprobe=4,quantizer_efSearch=32", - "nprobe=4,quantizer_efSearch=64", - "nprobe=8,quantizer_efSearch=32", - "nprobe=8,quantizer_efSearch=64", - "nprobe=16,quantizer_efSearch=32", - "nprobe=8,quantizer_efSearch=128", - "nprobe=16,quantizer_efSearch=64", - "nprobe=16,quantizer_efSearch=128", - "nprobe=32,quantizer_efSearch=64", - "nprobe=32,quantizer_efSearch=128", - "nprobe=32,quantizer_efSearch=256", - "nprobe=64,quantizer_efSearch=128", - "nprobe=64,quantizer_efSearch=256", - "nprobe=64,quantizer_efSearch=512", - "nprobe=128,quantizer_efSearch=128", - "nprobe=128,quantizer_efSearch=256", - "nprobe=128,quantizer_efSearch=512", - "nprobe=256,quantizer_efSearch=256", - "nprobe=256,quantizer_efSearch=512"] - diskann-t2: - docker-tag: billion-scale-benchmark-diskann - module: benchmark.algorithms.diskann-t2 - constructor: Diskann - base-args: ["@metric"] - run-groups: - base: - args: | - [{"R":100, "L":100, "B":47, "M":100, - "url": "https://comp21storage.blob.core.windows.net/publiccontainer/comp21/diskann-T2-baseline-indices/msspacev-1B/R100_L100_B47_M100" - }] - query-args: | - [{"Ls":40, "BW":4, "T":16}, - {"Ls":50, "BW":4, "T":16}, - {"Ls":60, "BW":4, "T":16}, - {"Ls":70, "BW":4, "T":16}, - {"Ls":80, "BW":4, "T":16}, - {"Ls":90, "BW":4, "T":16}, - {"Ls":100, "BW":4, "T":16}, - {"Ls":110, "BW":4, "T":16}, - {"Ls":120, "BW":4, "T":16}, - {"Ls":130, "BW":4, "T":16}] -msturing-1B: - faiss-t1: - docker-tag: billion-scale-benchmark-faissconda - module: benchmark.algorithms.faiss_t1 - constructor: Faiss - base-args: ["@metric"] - run-groups: - base: - args: | - [{"indexkey": 
"OPQ64_128,IVF1048576_HNSW32,PQ64x4fsr", - "url": "https://dl.fbaipublicfiles.com/billion-scale-ann-benchmarks/track1_baseline_faiss/msturing-1B.IVF1M_2level_PQ64x4fsr.faissindex", - "query_bs": 4096 - }] - query-args: | - ["nprobe=1,quantizer_efSearch=4", - "nprobe=2,quantizer_efSearch=4", - "nprobe=1,quantizer_efSearch=8", - "nprobe=2,quantizer_efSearch=8", - "nprobe=1,quantizer_efSearch=16", - "nprobe=2,quantizer_efSearch=16", - "nprobe=4,quantizer_efSearch=16", - "nprobe=2,quantizer_efSearch=32", - "nprobe=4,quantizer_efSearch=32", - "nprobe=8,quantizer_efSearch=32", - "nprobe=8,quantizer_efSearch=64", - "nprobe=16,quantizer_efSearch=64", - "nprobe=16,quantizer_efSearch=128", - "nprobe=32,quantizer_efSearch=128", - "nprobe=32,quantizer_efSearch=256", - "nprobe=64,quantizer_efSearch=128", - "nprobe=64,quantizer_efSearch=256", - "nprobe=128,quantizer_efSearch=128", - "nprobe=64,quantizer_efSearch=512", - "nprobe=128,quantizer_efSearch=256", - "nprobe=128,quantizer_efSearch=512", - "nprobe=256,quantizer_efSearch=256", - "nprobe=256,quantizer_efSearch=512"] - diskann-t2: - docker-tag: billion-scale-benchmark-diskann - module: benchmark.algorithms.diskann-t2 - constructor: Diskann - base-args: ["@metric"] - run-groups: - base: - args: | - [{"R":100, "L":100, "B":50, "M":80, - "url": "https://comp21storage.blob.core.windows.net/publiccontainer/comp21/diskann-T2-baseline-indices/msturing-1B/R100_L100_B50_M80" - }] - query-args: | - [{"Ls":30, "BW":4, "T":16}, - {"Ls":40, "BW":4, "T":16}, - {"Ls":50, "BW":4, "T":16}, - {"Ls":55, "BW":4, "T":16}, - {"Ls":57, "BW":4, "T":16}, - {"Ls":59, "BW":4, "T":16}, - {"Ls":60, "BW":4, "T":16}, - {"Ls":70, "BW":4, "T":16}, - {"Ls":80, "BW":4, "T":16}, - {"Ls":100, "BW":4, "T":16}] -bigann-1B: - faiss-t1: - docker-tag: billion-scale-benchmark-faissconda - module: benchmark.algorithms.faiss_t1 - constructor: Faiss - base-args: ["@metric"] - run-groups: - base: - args: | - [{"indexkey": "OPQ64_128,IVF1048576_HNSW32,PQ64x4fsr", - "url": 
"https://dl.fbaipublicfiles.com/billion-scale-ann-benchmarks/track1_baseline_faiss/bigann-1B.IVF1M_2level_PQ64x4fsr.faissindex" - }] - query-args: | - ["nprobe=1,quantizer_efSearch=4", - "nprobe=2,quantizer_efSearch=4", - "nprobe=4,quantizer_efSearch=4", - "nprobe=4,quantizer_efSearch=8", - "nprobe=8,quantizer_efSearch=4", - "nprobe=8,quantizer_efSearch=8", - "nprobe=8,quantizer_efSearch=16", - "nprobe=8,quantizer_efSearch=32", - "nprobe=16,quantizer_efSearch=16", - "nprobe=16,quantizer_efSearch=32", - "nprobe=16,quantizer_efSearch=64", - "nprobe=32,quantizer_efSearch=8", - "nprobe=32,quantizer_efSearch=32", - "nprobe=32,quantizer_efSearch=64", - "nprobe=32,quantizer_efSearch=128", - "nprobe=64,quantizer_efSearch=16", - "nprobe=64,quantizer_efSearch=32", - "nprobe=64,quantizer_efSearch=64", - "nprobe=64,quantizer_efSearch=128", - "nprobe=64,quantizer_efSearch=256", - "nprobe=128,quantizer_efSearch=32", - "nprobe=128,quantizer_efSearch=64", - "nprobe=128,quantizer_efSearch=128", - "nprobe=128,quantizer_efSearch=256", - "nprobe=128,quantizer_efSearch=512", - "nprobe=256,quantizer_efSearch=64", - "nprobe=256,quantizer_efSearch=128", - "nprobe=256,quantizer_efSearch=512"] - diskann-t2: - docker-tag: billion-scale-benchmark-diskann - module: benchmark.algorithms.diskann-t2 - constructor: Diskann - base-args: ["@metric"] - run-groups: - base: - args: | - [{"R":100, "L":100, "B":50, "M":80, - "url": "https://comp21storage.blob.core.windows.net/publiccontainer/comp21/diskann-T2-baseline-indices/bigann-1B/R100_L100_B50_M80" - }] - query-args: | - [{"Ls":30, "BW":4, "T":16}, - {"Ls":40, "BW":4, "T":16}, - {"Ls":50, "BW":4, "T":16}, - {"Ls":55, "BW":4, "T":16}, - {"Ls":60, "BW":4, "T":16}, - {"Ls":62, "BW":4, "T":16}, - {"Ls":65, "BW":4, "T":16}, - {"Ls":70, "BW":4, "T":16}, - {"Ls":80, "BW":4, "T":16}, - {"Ls":100, "BW":4, "T":16}] -ssnpp-1B: - faiss-t1: - docker-tag: billion-scale-benchmark-faissconda - module: benchmark.algorithms.faiss_t1 - constructor: Faiss - base-args: 
["@metric"] - run-groups: - base: - args: | - [{"indexkey": "OPQ32_128,IVF1048576_HNSW32,PQ32", - "url": "https://dl.fbaipublicfiles.com/billion-scale-ann-benchmarks/track1_baseline_faiss/ssnpp-1B.IVF1M_2level_PQ32.faissindex" - }] - query-args: | - ["nprobe=1,quantizer_efSearch=4,ht=92", - "nprobe=1,quantizer_efSearch=4,ht=98", - "nprobe=1,quantizer_efSearch=4,ht=104", - "nprobe=1,quantizer_efSearch=4,ht=112", - "nprobe=1,quantizer_efSearch=8,ht=96", - "nprobe=1,quantizer_efSearch=8,ht=108", - "nprobe=1,quantizer_efSearch=16,ht=98", - "nprobe=1,quantizer_efSearch=16,ht=114", - "nprobe=1,quantizer_efSearch=16,ht=116", - "nprobe=1,quantizer_efSearch=32,ht=98", - "nprobe=1,quantizer_efSearch=32,ht=110", - "nprobe=1,quantizer_efSearch=32,ht=112", - "nprobe=1,quantizer_efSearch=32,ht=120", - "nprobe=4,quantizer_efSearch=16,ht=256", - "nprobe=4,quantizer_efSearch=32,ht=104", - "nprobe=4,quantizer_efSearch=32,ht=112", - "nprobe=4,quantizer_efSearch=32,ht=256", - "nprobe=8,quantizer_efSearch=32,ht=112", - "nprobe=4,quantizer_efSearch=64,ht=256", - "nprobe=8,quantizer_efSearch=64,ht=116", - "nprobe=8,quantizer_efSearch=64,ht=128", - "nprobe=16,quantizer_efSearch=32,ht=256", - "nprobe=16,quantizer_efSearch=64,ht=118", - "nprobe=32,quantizer_efSearch=64,ht=256", - "nprobe=64,quantizer_efSearch=256,ht=116", - "nprobe=32,quantizer_efSearch=512,ht=256", - "nprobe=64,quantizer_efSearch=512,ht=126", - "nprobe=256,quantizer_efSearch=256,ht=128"] - diskann-t2: - docker-tag: billion-scale-benchmark-diskann - module: benchmark.algorithms.diskann-t2 - constructor: Diskann - base-args: ["@metric"] - run-groups: - base: - args: | - [{"R":100, "L":100, "B":60, "M":100, "C":500000, "CM":2, - "url": "https://comp21storage.blob.core.windows.net/publiccontainer/comp21/diskann-T2-baseline-indices/fbssnpp-1B/R100_L100_B60_M100" - }] - query-args: | - [{"Lmin":8, "Lmax":10000, "BW":4, "T":16}, - {"Lmin":12, "Lmax":10000, "BW":4, "T":16}, - {"Lmin":8, "Lmax":20000, "BW":4, "T":16}, - {"Lmin":12, 
"Lmax":20000, "BW":4, "T":16}, - {"Lmin":8, "Lmax":30000, "BW":4, "T":16}, - {"Lmin":12, "Lmax":30000, "BW":4, "T":16}, - {"Lmin":16, "Lmax":30000, "BW":4, "T":16}, - {"Lmin":8, "Lmax":45000, "BW":4, "T":16}, - {"Lmin":12, "Lmax":45000, "BW":4, "T":16}, - {"Lmin":16, "Lmax":45000, "BW":4, "T":16}] -text2image-1B: - faiss-t1: - docker-tag: billion-scale-benchmark-faissconda - module: benchmark.algorithms.faiss_t1 - constructor: Faiss - base-args: ["@metric"] - run-groups: - base: - args: | - [{"indexkey": "OPQ32_128,IVF1048576_HNSW32,PQ32", - "url": "https://dl.fbaipublicfiles.com/billion-scale-ann-benchmarks/track1_baseline_faiss/text2image-1B.IVF1M_2level_PQ32.faissindex" - }] - # Trying all combinations of nprobe x efSearch - query-args: | - ["nprobe=1,quantizer_efSearch=4,ht=106", - "nprobe=1,quantizer_efSearch=16,ht=114", - "nprobe=1,quantizer_efSearch=16,ht=116", - "nprobe=2,quantizer_efSearch=16,ht=110", - "nprobe=4,quantizer_efSearch=8,ht=118", - "nprobe=4,quantizer_efSearch=32,ht=256", - "nprobe=8,quantizer_efSearch=16,ht=114", - "nprobe=4,quantizer_efSearch=64,ht=118", - "nprobe=4,quantizer_efSearch=64,ht=122", - "nprobe=8,quantizer_efSearch=32,ht=116", - "nprobe=8,quantizer_efSearch=64,ht=116", - "nprobe=8,quantizer_efSearch=64,ht=126", - "nprobe=16,quantizer_efSearch=64,ht=256", - "nprobe=16,quantizer_efSearch=256,ht=118", - "nprobe=16,quantizer_efSearch=512,ht=256", - "nprobe=32,quantizer_efSearch=512,ht=128", - "nprobe=64,quantizer_efSearch=128,ht=126", - "nprobe=128,quantizer_efSearch=512,ht=256", - "nprobe=256,quantizer_efSearch=512,ht=120", - "nprobe=256,quantizer_efSearch=512,ht=122"] - diskann-t2: - docker-tag: billion-scale-benchmark-diskann - module: benchmark.algorithms.diskann-t2 - constructor: Diskann - base-args: ["@metric"] - run-groups: - base: - args: | - [{"R":100, "L":100, "B":60, "M":115, "PQ":200, "C":500000, "CM":2, - "url": 
"https://comp21storage.blob.core.windows.net/publiccontainer/comp21/diskann-T2-baseline-indices/text2image-1B/R100_L100_B60_M115_PQ200" - }] - query-args: | - [{"Ls":10, "BW":10, "T":16}, - {"Ls":20, "BW":10, "T":16}, - {"Ls":30, "BW":10, "T":16}, - {"Ls":40, "BW":10, "T":16}, - {"Ls":50, "BW":10, "T":16}, - {"Ls":60, "BW":10, "T":16}, - {"Ls":70, "BW":10, "T":16}, - {"Ls":80, "BW":10, "T":16}, - {"Ls":90, "BW":10, "T":16}, - {"Ls":100, "BW":10, "T":16}] -ssnpp-10M: - faiss-t1: - docker-tag: billion-scale-benchmark-faissconda - module: benchmark.algorithms.faiss_t1 - constructor: Faiss - base-args: ["@metric"] - run-groups: - base: - args: | - [{"indexkey": "OPQ32_128,IVF65536_HNSW32,PQ32" - }] - query-args: | - ["nprobe=1,quantizer_efSearch=4,ht=92", - "nprobe=1,quantizer_efSearch=4,ht=98", - "nprobe=1,quantizer_efSearch=4,ht=104", - "nprobe=1,quantizer_efSearch=4,ht=112"] -bigann-10M: - diskann-t2: - docker-tag: billion-scale-benchmark-diskann - module: benchmark.algorithms.diskann-t2 - constructor: Diskann - base-args: ["@metric"] - run-groups: - base: - args: | - [{"R":100, "L":100, "B":0.3, "M":15}] - query-args: | - [{"Ls":50, "BW":4, "T":16}] - -msturing-1M: - diskann-t2: - docker-tag: billion-scale-benchmark-diskann - module: benchmark.algorithms.diskann-t2 - constructor: Diskann - base-args: ["@metric"] - run-groups: - base: - args: | - [{"R":50, "L":50, "B":0.03, "M":1}] - query-args: | - [{"Ls":50, "BW":4, "T":16}] -msspacev-1M: - diskann-t2: - docker-tag: billion-scale-benchmark-diskann - module: benchmark.algorithms.diskann-t2 - constructor: Diskann - base-args: ["@metric"] - run-groups: - base: - args: | - [{"R":50, "L":50, "B":0.03, "M":1}] - query-args: | - [{"Ls":50, "BW":4, "T":16}] -text2image-1M: - diskann-t2: - docker-tag: billion-scale-benchmark-diskann - module: benchmark.algorithms.diskann-t2 - constructor: Diskann - base-args: ["@metric"] - run-groups: - base: - args: | - [{"R":50, "L":50, "B":0.03, "M":1, "PQ":200}] - query-args: | - 
[{"Ls":50, "BW":4, "T":16}] -text2image-10M: - diskann-t2: - docker-tag: billion-scale-benchmark-diskann - module: benchmark.algorithms.diskann-t2 - constructor: Diskann - base-args: ["@metric"] - run-groups: - base: - args: | - [{"R":50, "L":50, "B":0.3, "M":10, "PQ":200}] - query-args: | - [{"Ls":50, "BW":4, "T":16}] diff --git a/assets/aws_logo.png b/assets/aws_logo.png new file mode 100644 index 000000000..06df0852f Binary files /dev/null and b/assets/aws_logo.png differ diff --git a/assets/cmt_logo.png b/assets/cmt_logo.png new file mode 100644 index 000000000..4ad6a8404 Binary files /dev/null and b/assets/cmt_logo.png differ diff --git a/assets/discord_logo.png b/assets/discord_logo.png new file mode 100644 index 000000000..254977f0b Binary files /dev/null and b/assets/discord_logo.png differ diff --git a/assets/github_logo.png b/assets/github_logo.png new file mode 100644 index 000000000..7356d06ed Binary files /dev/null and b/assets/github_logo.png differ diff --git a/assets/github_logo_white.png b/assets/github_logo_white.png new file mode 100644 index 000000000..09cb6cc0b Binary files /dev/null and b/assets/github_logo_white.png differ diff --git a/assets/microsoft_logo.png b/assets/microsoft_logo.png new file mode 100644 index 000000000..315a95007 Binary files /dev/null and b/assets/microsoft_logo.png differ diff --git a/assets/og.png b/assets/og.png new file mode 100644 index 000000000..436c4c482 Binary files /dev/null and b/assets/og.png differ diff --git a/assets/organizers/amir-ingber.png b/assets/organizers/amir-ingber.png new file mode 100644 index 000000000..b895c1ff1 Binary files /dev/null and b/assets/organizers/amir-ingber.png differ diff --git a/assets/organizers/dmitry-baranchuk.png b/assets/organizers/dmitry-baranchuk.png new file mode 100644 index 000000000..ae807f3c3 Binary files /dev/null and b/assets/organizers/dmitry-baranchuk.png differ diff --git a/assets/organizers/edo-liberty.png b/assets/organizers/edo-liberty.png new file mode 
100644 index 000000000..f2911ee4d Binary files /dev/null and b/assets/organizers/edo-liberty.png differ diff --git a/assets/organizers/frank-liu.png b/assets/organizers/frank-liu.png new file mode 100644 index 000000000..41d8334cb Binary files /dev/null and b/assets/organizers/frank-liu.png differ diff --git a/assets/organizers/george-williams.png b/assets/organizers/george-williams.png new file mode 100644 index 000000000..3de8649f7 Binary files /dev/null and b/assets/organizers/george-williams.png differ diff --git a/assets/organizers/harsha-simhadri.png b/assets/organizers/harsha-simhadri.png new file mode 100644 index 000000000..626f6420f Binary files /dev/null and b/assets/organizers/harsha-simhadri.png differ diff --git "a/assets/organizers/martin-aum\303\274ller.png" "b/assets/organizers/martin-aum\303\274ller.png" new file mode 100644 index 000000000..a1deecbbc Binary files /dev/null and "b/assets/organizers/martin-aum\303\274ller.png" differ diff --git a/assets/organizers/matthijs-douze.png b/assets/organizers/matthijs-douze.png new file mode 100644 index 000000000..c0f6d8161 Binary files /dev/null and b/assets/organizers/matthijs-douze.png differ diff --git a/assets/pinecone-logo.svg b/assets/pinecone-logo.svg new file mode 100644 index 000000000..4f2753237 --- /dev/null +++ b/assets/pinecone-logo.svg @@ -0,0 +1,36 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/assets/zilliz-logo.png b/assets/zilliz-logo.png new file mode 100644 index 000000000..8b66a559e Binary files /dev/null and b/assets/zilliz-logo.png differ diff --git a/benchmark/__init__.py b/benchmark/__init__.py deleted file mode 100644 index c3961685a..000000000 --- a/benchmark/__init__.py +++ /dev/null @@ -1 +0,0 @@ -from __future__ import absolute_import diff --git a/benchmark/algorithms/base.py b/benchmark/algorithms/base.py deleted file mode 100644 index 903903b14..000000000 --- a/benchmark/algorithms/base.py +++ /dev/null 
@@ -1,113 +0,0 @@ -from __future__ import absolute_import -import psutil - -class BaseANN(object): - def done(self): - """ - This is called after results have been processed. - Use it for cleaning up if necessary. - """ - pass - - def track(self): - """ - return "T1" if submitting an entry for track 1 - return "T2" if submitting an entry for track 2 - return "T3" if submitting an entry for track 3 - """ - raise NotImplementedError() - - def fit(self, dataset): - """ - Build the index for the data points given in dataset name. - Assumes that after fitting index is loaded in memory. - """ - raise NotImplementedError() - - def load_index(self, dataset): - """ - Load the index for dataset. Returns False if index - is not available, True otherwise. - - Checking the index usually involves the dataset name - and the index build paramters passed during construction. - """ - raise NotImplementedError() - - def index_files_to_store(self, dataset): - """ - Specify a triplet with the local directory path of index files, - the common prefix name of index component(s) and a list of - index components that need to be uploaded to (after build) - or downloaded from (for search) cloud storage. - - For local directory path under docker environment, please use - a directory under - data/indices/track(T1 or T2)/algo.__str__()/DATASETS[dataset]().short_name() - """ - raise NotImplementedError() - - def query(self, X, k): - """Carry out a batch query for k-NN of query set X.""" - raise NotImplementedError() - - def range_query(self, X, radius): - """ - Carry out a batch query for range search with - radius. - """ - raise NotImplementedError() - - def get_results(self): - """ - Helper method to convert query results of k-NN search. - If there are nq queries, returns a (nq, k) array of integers - representing the indices of the k-NN for each query. - """ - return self.res - - def get_range_results(self): - """ - Helper method to convert query results of range search. 
- If there are nq queries, returns a triple lims, D, I. - lims is a (nq) array, such that - - I[lims[q]:lims[q + 1]] in int - - are the indices of the indices of the range results of query q, and - - D[lims[q]:lims[q + 1]] in float - - are the distances. - """ - return self.res - - def get_additional(self): - """ - Retrieve additional results. - Return a dictionary with metrics - and corresponding measured values. - - The following additional metrics are supported: - - `mean_latency` in microseconds, if this applies to your algorithm. - Skip if your algorithm batches query processing. - - `latency_999` is the 99.9pc latency in microseconds, if this applies - to your algorithm. Skip if your algorithm batches query processing. - - `dist_comps` is the total number of points in the base set - to which a query was compared. - - `mean_ssd_ios` is the average number of SSD I/Os per query for T2 algorithms. - """ - return {} - - def __str__(self): - return self.name - - def get_memory_usage(self): - """Return the current memory usage of this algorithm instance - (in kilobytes), or None if this information is not available.""" - # return in kB for backwards compatibility - return psutil.Process().memory_info().rss / 1024 diff --git a/benchmark/algorithms/definitions.py b/benchmark/algorithms/definitions.py deleted file mode 100644 index 836282bc7..000000000 --- a/benchmark/algorithms/definitions.py +++ /dev/null @@ -1,179 +0,0 @@ -from __future__ import absolute_import -from os import sep as pathsep -import collections -import importlib -import os -import sys -import traceback -import yaml -import json -from enum import Enum -from itertools import product - - -Definition = collections.namedtuple( - 'Definition', - ['algorithm', 'constructor', 'module', 'docker_tag', - 'arguments', 'query_argument_groups', 'disabled']) - - -def instantiate_algorithm(definition): - print('Trying to instantiate %s.%s(%s)' % - (definition.module, definition.constructor, definition.arguments)) - 
module = importlib.import_module(definition.module) - constructor = getattr(module, definition.constructor) - return constructor(*definition.arguments) - - -class InstantiationStatus(Enum): - AVAILABLE = 0 - NO_CONSTRUCTOR = 1 - NO_MODULE = 2 - - -def algorithm_status(definition): - try: - module = importlib.import_module(definition.module) - if hasattr(module, definition.constructor): - return InstantiationStatus.AVAILABLE - else: - return InstantiationStatus.NO_CONSTRUCTOR - except ImportError: - return InstantiationStatus.NO_MODULE - - -def _generate_combinations(args): - if isinstance(args, list): - args = [el if isinstance(el, list) else [el] for el in args] - return [list(x) for x in product(*args)] - elif isinstance(args, dict): - flat = [] - for k, v in args.items(): - if isinstance(v, list): - flat.append([(k, el) for el in v]) - else: - flat.append([(k, v)]) - return [dict(x) for x in product(*flat)] - elif isinstance(args, str): - l = json.loads(args.strip()) - return l - else: - raise TypeError("No args handling exists for %s" % type(args).__name__) - - -def _substitute_variables(arg, vs): - if isinstance(arg, dict): - return dict([(k, _substitute_variables(v, vs)) - for k, v in arg.items()]) - elif isinstance(arg, list): - return [_substitute_variables(a, vs) for a in arg] - elif isinstance(arg, str) and arg in vs: - return vs[arg] - else: - return arg - - -def _get_definitions(definition_file): - with open(definition_file, "r") as f: - return yaml.load(f, yaml.SafeLoader) - - -def list_algorithms(definition_file): - definitions = _get_definitions(definition_file) - - print('The following algorithms are supported...') - for point in definitions: - print('\t... for the point type "%s"...' % point) - for metric in definitions[point]: - print('\t\t... 
and the distance metric "%s":' % metric) - for algorithm in definitions[point][metric]: - print('\t\t\t%s' % algorithm) - - -def get_unique_algorithms(definition_file): - definitions = _get_definitions(definition_file) - algos = set() - for point in definitions: - for metric in definitions[point]: - for algorithm in definitions[point][metric]: - algos.add(algorithm) - return list(sorted(algos)) - - -def get_definitions(definition_file, dimension, dataset, - distance_metric="euclidean", count=10): - - definitions = _get_definitions(definition_file) - - algorithm_definitions = {} - if "any" in definitions: - algorithm_definitions.update(definitions["any"]) - if dataset in definitions: - algorithm_definitions.update(definitions[dataset]) - - definitions = [] - for (name, algo) in algorithm_definitions.items(): - for k in ['docker-tag', 'module', 'constructor']: - if k not in algo: - raise Exception( - 'algorithm %s does not define a "%s" property' % (name, k)) - - base_args = [] - if "base-args" in algo: - base_args = algo["base-args"] - - for run_group in algo["run-groups"].values(): - if "arg-groups" in run_group: - groups = [] - for arg_group in run_group["arg-groups"]: - if isinstance(arg_group, dict): - # Dictionaries need to be expanded into lists in order - # for the subsequent call to _generate_combinations to - # do the right thing - groups.append(_generate_combinations(arg_group)) - else: - groups.append(arg_group) - args = _generate_combinations(groups) - elif "args" in run_group: - args = _generate_combinations(run_group["args"]) - else: - assert False, "? what? 
%s" % run_group - - if "query-arg-groups" in run_group: - groups = [] - for arg_group in run_group["query-arg-groups"]: - if isinstance(arg_group, dict): - groups.append(_generate_combinations(arg_group)) - else: - groups.append(arg_group) - query_args = _generate_combinations(groups) - elif "query-args" in run_group: - query_args = _generate_combinations(run_group["query-args"]) - else: - query_args = [] - - for arg_group in args: - aargs = [] - aargs.extend(base_args) - if isinstance(arg_group, list): - aargs.extend(arg_group) - else: - aargs.append(arg_group) - - vs = { - "@count": count, - "@metric": distance_metric, - "@dimension": dimension - } - aargs = [_substitute_variables(arg, vs) for arg in aargs] - definitions.append(Definition( - algorithm=name, - docker_tag=algo['docker-tag'], - module=algo['module'], - constructor=algo['constructor'], - arguments=aargs, - query_argument_groups=query_args, - disabled=algo.get('disabled', False) - )) - - return definitions diff --git a/benchmark/algorithms/diskann-t2.py b/benchmark/algorithms/diskann-t2.py deleted file mode 100755 index 24daaa023..000000000 --- a/benchmark/algorithms/diskann-t2.py +++ /dev/null @@ -1,222 +0,0 @@ -from __future__ import absolute_import -import psutil -import os -import time -import numpy as np -import diskannpy - -from benchmark.algorithms.base import BaseANN -from benchmark.datasets import DATASETS, download_accelerated - -class Diskann(BaseANN): - def __init__(self, metric, index_params): - self.name = "DiskANN" - if (index_params.get("R")==None): - print("Error: missing parameter R") - return - if (index_params.get("L")==None): - print("Error: missing parameter L") - return - if (index_params.get("B")==None): - print("Error: missing parameter B") - return - if(index_params.get("M")==None): - print("Error: missing parameter M") - return - - self._index_params = index_params - self._metric = metric - - self.R = index_params.get("R") - self.L = index_params.get("L") - self.B = 
index_params.get("B") - self.M = index_params.get("M") - self.PQ = 0 if index_params.get("PQ") == None else index_params.get("PQ") - self.C = -1 if index_params.get("C") == None else index_params.get("C") - self.cache_mechanism = 1 if index_params.get("CM") == None else index_params.get("CM") - if self.C == 0: - self.cache_mechanism = 0 - print(self.PQ) - - def track(self): - return "T2" - - def index_name(self): - if self.PQ == 0: - return f"R{self.R}_L{self.L}_B{self.B}_M{self.M}" - else: - return f"R{self.R}_L{self.L}_B{self.B}_M{self.M}_PQ{self.PQ}" - - def create_index_dir(self, dataset): - index_dir = os.path.join(os.getcwd(), "data", "indices") - os.makedirs(index_dir, mode=0o777, exist_ok=True) - index_dir = os.path.join(index_dir, "T2") - os.makedirs(index_dir, mode=0o777, exist_ok=True) - index_dir = os.path.join(index_dir, self.__str__()) - os.makedirs(index_dir, mode=0o777, exist_ok=True) - index_dir = os.path.join(index_dir, dataset.short_name()) - os.makedirs(index_dir, mode=0o777, exist_ok=True) - index_dir = os.path.join(index_dir, self.index_name()) - os.makedirs(index_dir, mode=0o777, exist_ok=True) - return index_dir - - def fit(self, dataset): - """ - Build the index for the data points given in dataset name. 
- """ - - ds = DATASETS[dataset]() - d = ds.d - - buildthreads = self._index_params.get("buildthreads", -1) - if buildthreads == -1: - buildthreads = diskannpy.omp_get_max_threads() - - print("Set build-time number of threads:", buildthreads) - diskannpy.omp_set_num_threads(buildthreads) - - index_dir = self.create_index_dir(ds) - self.index_path = os.path.join(index_dir, self.index_name()) - - if ds.distance() == "euclidean": - metric = diskannpy.L2 - elif ds.distance() == "ip": - metric = diskannpy.INNER_PRODUCT - else: - print("Unsuported distance function.") - return False - - - if not hasattr(self, 'index'): - if ds.dtype == "float32": - self.index = diskannpy.DiskANNFloatIndex(metric) - elif ds.dtype == "int8": - self.index = diskannpy.DiskANNInt8Index(metric) - elif ds.dtype == "uint8": - self.index = diskannpy.DiskANNUInt8Index(metric) - else: - print ("Unsupported data type.") - return False - - start = time.time() - if self.PQ > 0: - self.index.build(ds.get_dataset_fn(), self.index_path, self.R, self.L, self.B, self.M, buildthreads, self.PQ) - else: - self.index.build(ds.get_dataset_fn(), self.index_path, self.R, self.L, self.B, self.M, buildthreads) - end = time.time() - print("DiskANN index built in %.3f s" % (end - start)) - - - if self.C > 0: - num_nodes_to_cache = self.C - else: - num_nodes_to_cache = int(ds.nb/1000) if ds.nb > 1000000 else int(ds.nb/100) - print(f"Loading index and caching {num_nodes_to_cache} nodes..") - self.index.load_index(self.index_path, diskannpy.omp_get_max_threads(), num_nodes_to_cache, self.cache_mechanism) - - def get_index_components(self, dataset): - index_components = [ - '_pq_pivots.bin', '_pq_pivots.bin_centroid.bin', '_pq_pivots.bin_chunk_offsets.bin', - '_pq_pivots.bin_rearrangement_perm.bin', '_sample_data.bin', '_sample_ids.bin', - '_pq_compressed.bin', '_disk.index' - ] - ds = DATASETS[dataset]() - if ds.distance() == "ip": - index_components = index_components + [ - '_disk.index_centroids.bin', 
'_disk.index_max_base_norm.bin', '_disk.index_medoids.bin' - ] - if self.PQ > 0: - index_components = index_components + [ - '_disk.index_pq_pivots.bin', '_disk.index_pq_pivots.bin_centroid.bin', - '_disk.index_pq_pivots.bin_chunk_offsets.bin', '_disk.index_pq_pivots.bin_rearrangement_perm.bin' - ] - return index_components - - def index_files_to_store(self, dataset): - return [self.create_index_dir(DATASETS[dataset]()), self.index_name(), self.get_index_components(dataset)] - - def load_index(self, dataset): - """ - Load the index for dataset. Returns False if index - is not available, True otherwise. - - Checking the index usually involves the dataset name - and the index build paramters passed during construction. - """ - ds = DATASETS[dataset]() - if ds.distance() == "euclidean": - metric = diskannpy.L2 - elif ds.distance() == "ip": - metric = diskannpy.INNER_PRODUCT - else: - print("Unsuported distance function.") - return False - - if ds.dtype == "float32": - self.index = diskannpy.DiskANNFloatIndex(metric) - elif ds.dtype == "int8": - self.index = diskannpy.DiskANNInt8Index(metric) - elif ds.dtype == "uint8": - self.index = diskannpy.DiskANNUInt8Index(metric) - else: - print ("Unsupported data type.") - return False - - index_dir = self.create_index_dir(ds) - if not (os.path.exists(index_dir)) and 'url' not in self._index_params: - return False - - index_path = os.path.join(index_dir, self.index_name()) - index_components = self.get_index_components(dataset) - - for component in index_components: - index_file = index_path + component - if not (os.path.exists(index_file)): - if 'url' in self._index_params: - index_file_source = self._index_params['url'] + '/' + self.index_name() + component - print(f"Downloading index in background. 
This can take a while.") - download_accelerated(index_file_source, index_file, quiet=True) - else: - return False - - print("Loading index") - - if self.C > 0: - num_nodes_to_cache = self.C - else: - num_nodes_to_cache = int(ds.nb/1000) if ds.nb > 1000000 else int(ds.nb/100) - if (self.index.load_index(index_path, diskannpy.omp_get_max_threads(), num_nodes_to_cache, self.cache_mechanism) == 0): - print ("Load index success.") - return True - else: - return False - - def query(self, X, k): - """Carry out a batch query for k-NN of query set X.""" - nq, dim = (np.shape(X)) - [self.res, self.query_dists], self.stats = self.index.batch_search_numpy_input(X, dim, nq, k, self.Ls, self.BW, self.threads) - self.stats["dist_comps"] = self.stats["mean_dist_comps"] * nq - - def range_query(self, X, radius): - """ - Carry out a batch query for range search with - radius. - """ - nq, dim = np.shape(X) - [self.rangeres_lim, [self.rangeres_ids, self.rangeres_dists]], self.stats = self.index.batch_range_search_numpy_input( - X, dim, nq, radius, self.Lmin, self.Lmax, self.BW, self.threads) - self.stats["dist_comps"] = self.stats["mean_dist_comps"] * nq - - def get_range_results(self): - return (self.rangeres_lim, self.rangeres_dists, self.rangeres_ids) - - def get_additional(self): - return self.stats - - def set_query_arguments(self, query_args): - self._query_args = query_args - self.Ls = 0 if query_args.get("Ls") == None else query_args.get("Ls") - self.Lmin = 0 if query_args.get("Lmin") == None else query_args.get("Lmin") - self.Lmax = 0 if query_args.get("Lmax") == None else query_args.get("Lmax") - self.BW = self._query_args.get("BW") - self.threads = self._query_args.get("T") diff --git a/benchmark/algorithms/diskann-v0_3.py b/benchmark/algorithms/diskann-v0_3.py deleted file mode 100644 index d1b7e0281..000000000 --- a/benchmark/algorithms/diskann-v0_3.py +++ /dev/null @@ -1,222 +0,0 @@ -from __future__ import absolute_import -import psutil -import os -import time -import 
numpy as np -import diskannpy - -from benchmark.algorithms.base import BaseANN -from benchmark.datasets import DATASETS, download_accelerated - -class Diskann(BaseANN): - def __init__(self, metric, index_params): - self.name = "DiskANN-v0.3" - if (index_params.get("R")==None): - print("Error: missing parameter R") - return - if (index_params.get("L")==None): - print("Error: missing parameter L") - return - if (index_params.get("B")==None): - print("Error: missing parameter B") - return - if(index_params.get("M")==None): - print("Error: missing parameter M") - return - - self._index_params = index_params - self._metric = metric - - self.R = index_params.get("R") - self.L = index_params.get("L") - self.B = index_params.get("B") - self.M = index_params.get("M") - self.PQ = 0 if index_params.get("PQ") == None else index_params.get("PQ") - self.C = -1 if index_params.get("C") == None else index_params.get("C") - self.cache_mechanism = 1 if index_params.get("CM") == None else index_params.get("CM") - if self.C == 0: - self.cache_mechanism = 0 - print(self.PQ) - - def track(self): - return "T2" - - def index_name(self): - if self.PQ == 0: - return f"R{self.R}_L{self.L}_B{self.B}_M{self.M}" - else: - return f"R{self.R}_L{self.L}_B{self.B}_M{self.M}_PQ{self.PQ}" - - def create_index_dir(self, dataset): - index_dir = os.path.join(os.getcwd(), "data", "indices") - os.makedirs(index_dir, mode=0o777, exist_ok=True) - index_dir = os.path.join(index_dir, "T2") - os.makedirs(index_dir, mode=0o777, exist_ok=True) - index_dir = os.path.join(index_dir, self.__str__()) - os.makedirs(index_dir, mode=0o777, exist_ok=True) - index_dir = os.path.join(index_dir, dataset.short_name()) - os.makedirs(index_dir, mode=0o777, exist_ok=True) - index_dir = os.path.join(index_dir, self.index_name()) - os.makedirs(index_dir, mode=0o777, exist_ok=True) - return index_dir - - def fit(self, dataset): - """ - Build the index for the data points given in dataset name. 
- """ - - ds = DATASETS[dataset]() - d = ds.d - - buildthreads = self._index_params.get("buildthreads", -1) - if buildthreads == -1: - buildthreads = diskannpy.omp_get_max_threads() - - print("Set build-time number of threads:", buildthreads) - diskannpy.omp_set_num_threads(buildthreads) - - index_dir = self.create_index_dir(ds) - self.index_path = os.path.join(index_dir, self.index_name()) - - if ds.distance() == "euclidean": - metric = diskannpy.L2 - elif ds.distance() == "ip": - metric = diskannpy.INNER_PRODUCT - else: - print("Unsuported distance function.") - return False - - - if not hasattr(self, 'index'): - if ds.dtype == "float32": - self.index = diskannpy.DiskANNFloatIndex(metric) - elif ds.dtype == "int8": - self.index = diskannpy.DiskANNInt8Index(metric) - elif ds.dtype == "uint8": - self.index = diskannpy.DiskANNUInt8Index(metric) - else: - print ("Unsupported data type.") - return False - - start = time.time() - if self.PQ > 0: - self.index.build(ds.get_dataset_fn(), self.index_path, self.R, self.L, self.B, self.M, buildthreads, self.PQ) - else: - self.index.build(ds.get_dataset_fn(), self.index_path, self.R, self.L, self.B, self.M, buildthreads) - end = time.time() - print("DiskANN index built in %.3f s" % (end - start)) - - - if self.C > 0: - num_nodes_to_cache = self.C - else: - num_nodes_to_cache = int(ds.nb/1000) if ds.nb > 1000000 else int(ds.nb/100) - print(f"Loading index and caching {num_nodes_to_cache} nodes..") - self.index.load_index(self.index_path, diskannpy.omp_get_max_threads(), num_nodes_to_cache, self.cache_mechanism) - - def get_index_components(self, dataset): - index_components = [ - '_pq_pivots.bin', '_pq_pivots.bin_centroid.bin', '_pq_pivots.bin_chunk_offsets.bin', - '_pq_pivots.bin_rearrangement_perm.bin', '_sample_data.bin', '_sample_ids.bin', - '_pq_compressed.bin', '_disk.index', '_disk.index_medoids.bin' - ] - ds = DATASETS[dataset]() - if ds.distance() == "ip": - index_components = index_components + [ - 
'_disk.index_centroids.bin', '_disk.index_max_base_norm.bin', '_disk.index_medoids.bin' - ] - if self.PQ > 0: - index_components = index_components + [ - '_disk.index_pq_pivots.bin', '_disk.index_pq_pivots.bin_centroid.bin', - '_disk.index_pq_pivots.bin_chunk_offsets.bin', '_disk.index_pq_pivots.bin_rearrangement_perm.bin' - ] - return index_components - - def index_files_to_store(self, dataset): - return [self.create_index_dir(DATASETS[dataset]()), self.index_name(), self.get_index_components(dataset)] - - def load_index(self, dataset): - """ - Load the index for dataset. Returns False if index - is not available, True otherwise. - - Checking the index usually involves the dataset name - and the index build paramters passed during construction. - """ - ds = DATASETS[dataset]() - if ds.distance() == "euclidean": - metric = diskannpy.L2 - elif ds.distance() == "ip": - metric = diskannpy.INNER_PRODUCT - else: - print("Unsuported distance function.") - return False - - if ds.dtype == "float32": - self.index = diskannpy.DiskANNFloatIndex(metric) - elif ds.dtype == "int8": - self.index = diskannpy.DiskANNInt8Index(metric) - elif ds.dtype == "uint8": - self.index = diskannpy.DiskANNUInt8Index(metric) - else: - print ("Unsupported data type.") - return False - - index_dir = self.create_index_dir(ds) - if not (os.path.exists(index_dir)) and 'url' not in self._index_params: - return False - - index_path = os.path.join(index_dir, self.index_name()) - index_components = self.get_index_components(dataset) - - for component in index_components: - index_file = index_path + component - if not (os.path.exists(index_file)): - if 'url' in self._index_params: - index_file_source = self._index_params['url'] + '/' + self.index_name() + component - print(f"Downloading index in background. 
This can take a while.") - download_accelerated(index_file_source, index_file, quiet=True) - else: - return False - - print("Loading index") - - if self.C > 0: - num_nodes_to_cache = self.C - else: - num_nodes_to_cache = int(ds.nb/1000) if ds.nb > 1000000 else int(ds.nb/100) - if (self.index.load_index(index_path, diskannpy.omp_get_max_threads(), num_nodes_to_cache, self.cache_mechanism) == 0): - print ("Load index success.") - return True - else: - return False - - def query(self, X, k): - """Carry out a batch query for k-NN of query set X.""" - nq, dim = (np.shape(X)) - [self.res, self.query_dists], self.stats = self.index.batch_search_numpy_input(X, dim, nq, k, self.Ls, self.BW, self.threads) - self.stats["dist_comps"] = self.stats["mean_dist_comps"] * nq - - def range_query(self, X, radius): - """ - Carry out a batch query for range search with - radius. - """ - nq, dim = np.shape(X) - [self.rangeres_lim, [self.rangeres_ids, self.rangeres_dists]], self.stats = self.index.batch_range_search_numpy_input( - X, dim, nq, radius, self.Lmin, self.Lmax, self.BW, self.threads) - self.stats["dist_comps"] = self.stats["mean_dist_comps"] * nq - - def get_range_results(self): - return (self.rangeres_lim, self.rangeres_dists, self.rangeres_ids) - - def get_additional(self): - return self.stats - - def set_query_arguments(self, query_args): - self._query_args = query_args - self.Ls = 0 if query_args.get("Ls") == None else query_args.get("Ls") - self.Lmin = 0 if query_args.get("Lmin") == None else query_args.get("Lmin") - self.Lmax = 0 if query_args.get("Lmax") == None else query_args.get("Lmax") - self.BW = self._query_args.get("BW") - self.threads = self._query_args.get("T") diff --git a/benchmark/algorithms/elastiknn.py b/benchmark/algorithms/elastiknn.py deleted file mode 100644 index e69de29bb..000000000 diff --git a/benchmark/algorithms/faiss_inmem.py b/benchmark/algorithms/faiss_inmem.py deleted file mode 100644 index 4c5803edb..000000000 --- 
a/benchmark/algorithms/faiss_inmem.py +++ /dev/null @@ -1,75 +0,0 @@ -from __future__ import absolute_import -#import sys -#sys.path.append("install/lib-faiss") # noqa -import numpy -import sklearn.preprocessing -import ctypes -import faiss -import os -from benchmark.algorithms.base import BaseANN -from benchmark.datasets import DATASETS - - -class Faiss(BaseANN): - def query(self, X, n): - if self._metric == 'angular': - X /= numpy.linalg.norm(X) - self.res = self.index.search(X.astype(numpy.float32), n) - - def get_results(self): - D, I = self.res - return I -# res = [] -# for i in range(len(D)): -# r = [] -# for l, d in zip(L[i], D[i]): -# if l != -1: -# r.append(l) -# res.append(r) -# return res - - -class FaissIVF(Faiss): - def __init__(self, metric, n_list): - self._n_list = n_list - self._metric = metric - - def index_name(self, name): - return f"data/ivf_{name}_{self._n_list}_{self._metric}" - - def fit(self, dataset): - X = DATASETS[dataset]().get_dataset() # assumes it fits into memory - - if self._metric == 'angular': - X = sklearn.preprocessing.normalize(X, axis=1, norm='l2') - - if X.dtype != numpy.float32: - X = X.astype(numpy.float32) - - self.quantizer = faiss.IndexFlatL2(X.shape[1]) - index = faiss.IndexIVFFlat( - self.quantizer, X.shape[1], self._n_list, faiss.METRIC_L2) - index.train(X) - index.add(X) - faiss.write_index(index, self.index_name(dataset)) - self.index = index - - def load_index(self, dataset): - if not os.path.exists(self.index_name(dataset)): - return False - - self.index = faiss.read_index(self.index_name(dataset)) - return True - - def set_query_arguments(self, n_probe): - faiss.cvar.indexIVF_stats.reset() - self._n_probe = n_probe - self.index.nprobe = self._n_probe - - def get_additional(self): - return {"dist_comps": faiss.cvar.indexIVF_stats.ndis + # noqa - faiss.cvar.indexIVF_stats.nq * self._n_list} - - def __str__(self): - return 'FaissIVF(n_list=%d, n_probe=%d)' % (self._n_list, - self._n_probe) diff --git 
a/benchmark/algorithms/faiss_t1.py b/benchmark/algorithms/faiss_t1.py deleted file mode 100644 index 75684c427..000000000 --- a/benchmark/algorithms/faiss_t1.py +++ /dev/null @@ -1,314 +0,0 @@ -from __future__ import absolute_import -import numpy as np -import sklearn.preprocessing -import ctypes -import faiss -import os -import time -from benchmark.algorithms.base import BaseANN -from benchmark.datasets import DATASETS, download_accelerated - -def knn_search_batched(index, xq, k, bs): - D, I = [], [] - for i0 in range(0, len(xq), bs): - Di, Ii = index.search(xq[i0:i0 + bs], k) - D.append(Di) - I.append(Ii) - return np.vstack(D), np.vstack(I) - -def unwind_index_ivf(index): - if isinstance(index, faiss.IndexPreTransform): - assert index.chain.size() == 1 - vt = faiss.downcast_VectorTransform(index.chain.at(0)) - index_ivf, vt2 = unwind_index_ivf(faiss.downcast_index(index.index)) - assert vt2 is None - return index_ivf, vt - if hasattr(faiss, "IndexRefine") and isinstance(index, faiss.IndexRefine): - return unwind_index_ivf(faiss.downcast_index(index.base_index)) - if isinstance(index, faiss.IndexIVF): - return index, None - else: - return None, None - -def two_level_clustering(xt, nc1, nc2, clustering_niter=25, spherical=False): - d = xt.shape[1] - - print(f"2-level clustering of {xt.shape} nb clusters = {nc1}*{nc2} = {nc1*nc2}") - print("perform coarse training") - - km = faiss.Kmeans( - d, nc1, verbose=True, niter=clustering_niter, - max_points_per_centroid=2000, - spherical=spherical - ) - km.train(xt) - - print() - - # coarse centroids - centroids1 = km.centroids - - print("assigning the training set") - t0 = time.time() - _, assign1 = km.assign(xt) - bc = np.bincount(assign1, minlength=nc1) - print(f"done in {time.time() - t0:.2f} s. 
Sizes of clusters {min(bc)}-{max(bc)}") - o = assign1.argsort() - del km - - # train sub-clusters - i0 = 0 - c2 = [] - t0 = time.time() - for c1 in range(nc1): - print(f"[{time.time() - t0:.2f} s] training sub-cluster {c1}/{nc1}\r", end="", flush=True) - i1 = i0 + bc[c1] - subset = o[i0:i1] - assert np.all(assign1[subset] == c1) - km = faiss.Kmeans(d, nc2, spherical=spherical) - xtsub = xt[subset] - km.train(xtsub) - c2.append(km.centroids) - i0 = i1 - print(f"done in {time.time() - t0:.2f} s") - return np.vstack(c2) - - -class Faiss(BaseANN): - def __init__(self, metric, index_params): - self._index_params = index_params - self._metric = metric - self._query_bs = -1 - self.indexkey = index_params.get("indexkey", "OPQ32_128,IVF65536_HNSW32,PQ32") - - if 'query_bs' in index_params: - self._query_bs = index_params['query_bs'] - - def track(self): - return "T1" - - def index_name(self, name): - return f"data/{name}.{self.indexkey}.faissindex" - - def fit(self, dataset): - index_params = self._index_params - - ds = DATASETS[dataset]() - d = ds.d - - # get build parameters - buildthreads = index_params.get("buildthreads", -1) - by_residual = index_params.get("by_residual", -1) - maxtrain = index_params.get("maxtrain", 0) - clustering_niter = index_params.get("clustering_niter", -1) - add_bs = index_params.get("add_bs", 100000) - add_splits = index_params.get("add_splits", 1) - efSearch = index_params.get("quantizer_add_efSearch", 80) - efConstruction = index_params.get("quantizer_efConstruction", 200) - use_two_level_clustering = index_params.get("two_level_clustering", True) - indexfile = self.index_name(dataset) - - if buildthreads == -1: - print("Build-time number of threads:", faiss.omp_get_max_threads()) - else: - print("Set build-time number of threads:", buildthreads) - faiss.omp_set_num_threads(buildthreads) - - metric_type = ( - faiss.METRIC_L2 if ds.distance() == "euclidean" else - faiss.METRIC_INNER_PRODUCT if ds.distance() in ("ip", "angular") else - 1/0 - ) 
- index = faiss.index_factory(d, self.indexkey, metric_type) - - index_ivf, vec_transform = unwind_index_ivf(index) - if vec_transform is None: - vec_transform = lambda x: x - else: - vec_transform = faiss.downcast_VectorTransform(vec_transform) - - if by_residual != -1: - by_residual = by_residual == 1 - print("setting by_residual = ", by_residual) - index_ivf.by_residual # check if field exists - index_ivf.by_residual = by_residual - - if index_ivf: - print("Update add-time parameters") - # adjust default parameters used at add time for quantizers - # because otherwise the assignment is inaccurate - quantizer = faiss.downcast_index(index_ivf.quantizer) - if isinstance(quantizer, faiss.IndexRefine): - print(" update quantizer k_factor=", quantizer.k_factor, end=" -> ") - quantizer.k_factor = 32 if index_ivf.nlist < 1e6 else 64 - print(quantizer.k_factor) - base_index = faiss.downcast_index(quantizer.base_index) - if isinstance(base_index, faiss.IndexIVF): - print(" update quantizer nprobe=", base_index.nprobe, end=" -> ") - base_index.nprobe = ( - 16 if base_index.nlist < 1e5 else - 32 if base_index.nlist < 4e6 else - 64) - print(base_index.nprobe) - elif isinstance(quantizer, faiss.IndexHNSW): - print(" update quantizer efSearch=", quantizer.hnsw.efSearch, end=" -> ") - if index_params.get("quantizer_add_efSearch", 80) > 0: - quantizer.hnsw.efSearch = efSearch - else: - quantizer.hnsw.efSearch = 40 if index_ivf.nlist < 4e6 else 64 - print(quantizer.hnsw.efSearch) - if efConstruction != -1: - print(" update quantizer efConstruction=", quantizer.hnsw.efConstruction, end=" -> ") - quantizer.hnsw.efConstruction = efConstruction - print(quantizer.hnsw.efConstruction) - - - index.verbose = True - if index_ivf: - index_ivf.verbose = True - index_ivf.quantizer.verbose = True - index_ivf.cp.verbose = True - - - if maxtrain == 0: - if 'IMI' in self.indexkey: - maxtrain = int(256 * 2 ** (np.log2(index_ivf.nlist) / 2)) - elif index_ivf: - maxtrain = 50 * index_ivf.nlist - 
else: - # just guess... - maxtrain = 256 * 100 - maxtrain = max(maxtrain, 256 * 100) - print("setting maxtrain to %d" % maxtrain) - - # train on dataset - print(f"getting first {maxtrain} dataset vectors for training") - - xt2 = next(ds.get_dataset_iterator(bs=maxtrain)) - - print("train, size", xt2.shape) - assert np.all(np.isfinite(xt2)) - - t0 = time.time() - - if (isinstance(vec_transform, faiss.OPQMatrix) and - isinstance(index_ivf, faiss.IndexIVFPQFastScan)): - print(" Forcing OPQ training PQ to PQ4") - ref_pq = index_ivf.pq - training_pq = faiss.ProductQuantizer( - ref_pq.d, ref_pq.M, ref_pq.nbits - ) - vec_transform.pq - vec_transform.pq = training_pq - - if clustering_niter >= 0: - print(("setting nb of clustering iterations to %d" % - clustering_niter)) - index_ivf.cp.niter = clustering_niter - - train_index = None - - if use_two_level_clustering: - sqrt_nlist = int(np.sqrt(index_ivf.nlist)) - assert sqrt_nlist ** 2 == index_ivf.nlist - - centroids_trainset = xt2 - if isinstance(vec_transform, faiss.VectorTransform): - print(" training vector transform") - vec_transform.train(xt2) - print(" transform trainset") - centroids_trainset = vec_transform.apply_py(centroids_trainset) - - centroids = two_level_clustering( - centroids_trainset, sqrt_nlist, sqrt_nlist, - spherical=(metric_type == faiss.METRIC_INNER_PRODUCT) - ) - - if not index_ivf.quantizer.is_trained: - print(" training quantizer") - index_ivf.quantizer.train(centroids) - - print(" add centroids to quantizer") - index_ivf.quantizer.add(centroids) - - index.train(xt2) - print(" Total train time %.3f s" % (time.time() - t0)) - - if train_index is not None: - del train_index - index_ivf.clustering_index = None - gc.collect() - - print("adding") - - t0 = time.time() - add_bs = index_params.get("add_bs", 10000000) - if add_bs == -1: - index.add(ds.get_database()) - else: - i0 = 0 - for xblock in ds.get_dataset_iterator(bs=add_bs): - i1 = i0 + len(xblock) - print(" adding %d:%d / %d [%.3f s, RSS %d kiB] 
" % ( - i0, i1, ds.nb, time.time() - t0, - faiss.get_mem_usage_kb())) - index.add(xblock) - i0 = i1 - - print(" add in %.3f s" % (time.time() - t0)) - print("storing", ) - faiss.write_index(index, self.index_name(dataset)) - - self.index = index - self.ps = faiss.ParameterSpace() - self.ps.initialize(self.index) - - def load_index(self, dataset): - if not os.path.exists(self.index_name(dataset)): - if 'url' not in self._index_params: - return False - - print('Downloading index in background. This can take a while.') - download_accelerated(self._index_params['url'], self.index_name(dataset), quiet=True) - - print("Loading index") - - self.index = faiss.read_index(self.index_name(dataset)) - - self.ps = faiss.ParameterSpace() - self.ps.initialize(self.index) - - return True - - def set_query_arguments(self, query_args): - faiss.cvar.indexIVF_stats.reset() - self.ps.set_index_parameters(self.index, query_args) - self.qas = query_args - - - # shall we return something interesting here? - def get_additional(self): - return {"dist_comps": faiss.cvar.indexIVF_stats.ndis} - - def __str__(self): - return f'FaissIVFPQ({self.qas})' - - - - def query(self, X, n): - if self._query_bs == -1: - self.res = self.index.search(X, n) - else: - self.res = knn_search_batched(self.index, X, n, self._query_bs) - - def range_query(self, X, radius): - if self._query_bs != -1: - raise NotImplemented - self.res = self.index.range_search(X, radius) - - def get_results(self): - D, I = self.res - return I - - def get_range_results(self): - return self.res diff --git a/benchmark/algorithms/faiss_t3.py b/benchmark/algorithms/faiss_t3.py deleted file mode 100644 index 622e121b1..000000000 --- a/benchmark/algorithms/faiss_t3.py +++ /dev/null @@ -1,475 +0,0 @@ -from __future__ import absolute_import -import numpy as np -import sklearn.preprocessing -import ctypes -import faiss -import os -import time -import gc -import resource -import threading -import json - -from multiprocessing.pool import 
ThreadPool - -from benchmark.algorithms.base import BaseANN -from benchmark.datasets import DATASETS, download_accelerated - -def unwind_index_ivf(index): - if isinstance(index, faiss.IndexPreTransform): - assert index.chain.size() == 1 - vt = index.chain.at(0) - index_ivf, vt2 = unwind_index_ivf(faiss.downcast_index(index.index)) - assert vt2 is None - return index_ivf, vt - if hasattr(faiss, "IndexRefine") and isinstance(index, faiss.IndexRefine): - return unwind_index_ivf(faiss.downcast_index(index.base_index)) - if isinstance(index, faiss.IndexIVF): - return index, None - else: - return None, None - -def rate_limited_iter(l): - 'a thread pre-processes the next element' - pool = ThreadPool(1) - res = None - - def next_or_None(): - try: - return next(l) - except StopIteration: - return None - - while True: - res_next = pool.apply_async(next_or_None) - if res is not None: - res = res.get() - if res is None: - return - yield res - res = res_next - -def build_index(buildthreads, by_residual, maxtrain, clustering_niter, - indexkey, indexfile, add_bs, add_splits, ds, train_on_gpu=True, quantizer_on_gpu_add=True): - - nq, d = ds.nq, ds.d - nb, d = ds.nq, ds.d - - if buildthreads == -1: - print("Build-time number of threads:", faiss.omp_get_max_threads()) - else: - print("Set build-time number of threads:", buildthreads) - faiss.omp_set_num_threads(buildthreads) - - metric_type = ( - faiss.METRIC_L2 if ds.distance() == "euclidean" else - faiss.METRIC_INNER_PRODUCT if ds.distance() in ("ip", "angular") else - 1/0 - ) - index = faiss.index_factory(d, indexkey, metric_type) - - index_ivf, vec_transform = unwind_index_ivf(index) - if vec_transform is None: - vec_transform = lambda x: x - else: - vec_transform = faiss.downcast_VectorTransform(vec_transform) - - if by_residual != -1: - by_residual = by_residual == 1 - index_ivf.by_residual # check if field exists - index_ivf.by_residual = by_residual - - if index_ivf: - print("Update add-time parameters") - # adjust default 
parameters used at add time for quantizers - # because otherwise the assignment is inaccurate - quantizer = faiss.downcast_index(index_ivf.quantizer) - if isinstance(quantizer, faiss.IndexRefine): - print(" update quantizer k_factor=", quantizer.k_factor, end=" -> ") - quantizer.k_factor = 32 if index_ivf.nlist < 1e6 else 64 - print(quantizer.k_factor) - base_index = faiss.downcast_index(quantizer.base_index) - if isinstance(base_index, faiss.IndexIVF): - print(" update quantizer nprobe=", base_index.nprobe, end=" -> ") - base_index.nprobe = ( - 16 if base_index.nlist < 1e5 else - 32 if base_index.nlist < 4e6 else - 64) - print(base_index.nprobe) - - index.verbose = True - if index_ivf: - index_ivf.verbose = True - index_ivf.quantizer.verbose = True - index_ivf.cp.verbose = True - - if maxtrain == 0: - if 'IMI' in indexkey: - maxtrain = int(256 * 2 ** (np.log2(index_ivf.nlist) / 2)) - elif index_ivf: - maxtrain = 50 * index_ivf.nlist - else: - # just guess... - maxtrain = 256 * 100 - maxtrain = max(maxtrain, 256 * 100) - print("setting maxtrain to %d" % maxtrain) - - # train on dataset - print(f"getting first {maxtrain} dataset vectors for training") - - xt2 = next(ds.get_dataset_iterator(bs=maxtrain)) - - print("train, size", xt2.shape) - assert np.all(np.isfinite(xt2)) - - t0 = time.time() - - if (isinstance(vec_transform, faiss.OPQMatrix) and - isinstance(index_ivf, faiss.IndexIVFPQFastScan)): - print(" Forcing OPQ training PQ to PQ4") - ref_pq = index_ivf.pq - training_pq = faiss.ProductQuantizer( - ref_pq.d, ref_pq.M, ref_pq.nbits - ) - vec_transform.pq - vec_transform.pq = training_pq - - if clustering_niter >= 0: - print(("setting nb of clustering iterations to %d" % - clustering_niter)) - index_ivf.cp.niter = clustering_niter - - train_index = None - if train_on_gpu: - print("add a training index on GPU") - train_index = faiss.index_cpu_to_all_gpus( - faiss.IndexFlatL2(index_ivf.d)) - index_ivf.clustering_index = train_index - - index.train(xt2) - print(" 
Total train time %.3f s" % (time.time() - t0)) - - if train_index is not None: - del train_index - index_ivf.clustering_index = None - gc.collect() - - print("adding") - - t0 = time.time() - - if not quantizer_on_gpu_add: - i0 = 0 - for xblock in ds.get_dataset_iterator(bs=add_bs): - i1 = i0 + len(xblock) - print(" adding %d:%d / %d [%.3f s, RSS %d kiB] " % ( - i0, i1, ds.nb, time.time() - t0, - faiss.get_mem_usage_kb())) - index.add(xblock) - i0 = i1 - elif True: - quantizer_gpu = faiss.index_cpu_to_all_gpus(index_ivf.quantizer) - - nsplit = add_splits - - def produce_batches(sno): - for xblock in ds.get_dataset_iterator(bs=add_bs, split=(nsplit, sno)): - _, assign = quantizer_gpu.search(xblock, 1) - yield xblock, assign.ravel() - - i0 = 0 - for sno in range(nsplit): - print(f"============== SPLIT {sno}/{nsplit}") - - stage2 = rate_limited_iter(produce_batches(sno)) - for xblock, assign in stage2: - i1 = i0 + len(xblock) - print(" adding %d:%d / %d [%.3f s, RSS %d kiB] " % ( - i0, i1, ds.nb, time.time() - t0, - faiss.get_mem_usage_kb())) - index.add_core( - len(xblock), - faiss.swig_ptr(xblock), - None, - faiss.swig_ptr(assign) - ) - i0 = i1 - del quantizer_gpu - gc.collect() - - print(" add in %.3f s" % (time.time() - t0)) - if indexfile: - print("storing", indexfile) - faiss.write_index(index, indexfile) - - return index - -class IndexQuantizerOnGPU: - """ run query quantization on GPU """ - - def __init__(self, index, search_bs): - self.search_bs = search_bs - index_ivf, vec_transform = unwind_index_ivf(index) - self.index_ivf = index_ivf - if vec_transform: -# print(type(vec_transform),dir(vec_transform)) - self.vec_transform = vec_transform.apply - else: - self.vec_transform = None - self.quantizer_gpu = faiss.index_cpu_to_all_gpus(self.index_ivf.quantizer) - - - def produce_batches(self, x, bs): - n = len(x) - nprobe = self.index_ivf.nprobe - ivf_stats = faiss.cvar.indexIVF_stats - for i0 in range(0, n, bs): - xblock = x[i0:i0 + bs] - t0 = time.time() - D, I 
= self.quantizer_gpu.search(xblock, nprobe) - ivf_stats.quantization_time += 1000 * (time.time() - t0) - yield i0, xblock, D, I - - - def search(self, x, k): - - if x.dtype!=np.float32: #GW- why do we need this now? - x = x.astype( np.float32 ) - - bs = self.search_bs - if self.vec_transform: - x = self.vec_transform(x) - nprobe = self.index_ivf.nprobe - n, d = x.shape - assert self.index_ivf.d == d - D = np.empty((n, k), dtype=np.float32) - I = np.empty((n, k), dtype=np.int64) - - sp = faiss.swig_ptr - stage2 = rate_limited_iter(self.produce_batches(x, bs)) - t0 = time.time() - for i0, xblock, Dc, Ic in stage2: - ni = len(xblock) - self.index_ivf.search_preassigned( - ni, faiss.swig_ptr(xblock), - k, sp(Ic), sp(Dc), - sp(D[i0:]), sp(I[i0:]), - False - ) - - return D, I - - def range_search(self, x, radius): - - x = x.astype( np.float32 ) #GW - why do we need this now? - - bs = self.search_bs - if self.vec_transform: - x = self.vec_transform(x) - nprobe = self.index_ivf.nprobe - n, d = x.shape - assert self.index_ivf.d == d - - sp = faiss.swig_ptr - rsp = faiss.rev_swig_ptr - stage2 = rate_limited_iter(self.produce_batches(x, bs)) - t0 = time.time() - all_res = [] - nres = 0 - for i0, xblock, Dc, Ic in stage2: - ni = len(xblock) - res = faiss.RangeSearchResult(ni) - - self.index_ivf.range_search_preassigned( - ni, faiss.swig_ptr(xblock), - radius, sp(Ic), sp(Dc), - res - ) - all_res.append((ni, res)) - lims = rsp(res.lims, ni + 1) - nres += lims[-1] - nres = int(nres) - lims = np.zeros(n + 1, int) - I = np.empty(nres, int) - D = np.empty(nres, 'float32') - - n0 = 0 - for ni, res in all_res: - lims_i = rsp(res.lims, ni + 1) - nd = int(lims_i[-1]) - Di = rsp(res.distances, nd) - Ii = rsp(res.labels, nd) - i0 = int(lims[n0]) - lims[n0: n0 + ni + 1] = lims_i + i0 - I[i0:i0 + nd] = Ii - D[i0:i0 + nd] = Di - n0 += ni - - return lims, D, I - - -class FaissT3(BaseANN): - def __init__(self, metric, index_params): - self._index_params = index_params - self._metric = metric - 
- def track(self): - return "T3" - - def index_name(self, name): - return f"data/{name}.{self._index_params['indexkey']}.faissindex" - - def fit(self, dataset): - index_params = self._index_params - - ds = DATASETS[dataset]() - d = ds.d - - # get build parameters - buildthreads = index_params.get("buildthreads", -1) - by_residual = index_params.get("by_residual", -1) - maxtrain = index_params.get("maxtrain", 0) - clustering_niter = index_params.get("clustering_niter", -1) - indexkey = index_params.get("indexkey", "IVF1048576,SQ8") - add_bs = index_params.get("add_bs", 100000) - add_splits = index_params.get("add_splits", 1) - indexfile = self.index_name(dataset) - - # determine how we use the GPU - #search_type = ds.search_type() - #if search_type == "knn": - # train_on_gpu = True - # quantizer_on_gpu_add = True - #else: #range - # train_on_gpu = False - # quantizer_on_gpu_add = False - - index = build_index(buildthreads, by_residual, maxtrain, clustering_niter, indexkey, - indexfile, add_bs, add_splits, ds) - - index_ivf, vec_transform = unwind_index_ivf(index) - if vec_transform is None: - vec_transform = lambda x: x - if index_ivf is not None: - print("imbalance_factor=", index_ivf.invlists.imbalance_factor()) - - no_precomputed_tables = index_params.get("no_precomputed_tables", True) - if no_precomputed_tables: - if isinstance(index_ivf, faiss.IndexIVFPQ): - print("disabling precomputed table") - index_ivf.use_precomputed_table = -1 - index_ivf.precomputed_table.clear() - - precomputed_table_size = 0 - if hasattr(index_ivf, 'precomputed_table'): - precomputed_table_size = index_ivf.precomputed_table.size() * 4 - print("precomputed tables size:", precomputed_table_size) - - searchthreads = index_params.get("searchthreads", -1) - if searchthreads == -1: - print("Search threads:", faiss.omp_get_max_threads()) - else: - print("Setting nb of threads to", searchthreads) - faiss.omp_set_num_threads(searchthreads) - - parallel_mode = index_params.get("parallel_mode", 
3) - if parallel_mode != -1: - print("setting IVF parallel mode to", parallel_mode) - index_ivf.parallel_mode - index_ivf.parallel_mode = parallel_mode - - # prep for the searches - - self.ps = faiss.ParameterSpace() - self.ps.initialize(index) - - search_bs = index_params.get("search_bs", 8192) - index_wrap = IndexQuantizerOnGPU(index, search_bs) - - self.cpuindex = index - self.index = index_wrap - - def load_index(self, dataset): - - index_params = self._index_params - - if not os.path.exists(self.index_name(dataset)): - if 'url' not in self._index_params: - return False - - print('Downloading index in background. This can take a while.') - download_accelerated(self._index_params['url'], self.index_name(dataset), quiet=True) - - print("Loading index",self.index_name(dataset)) - - index = faiss.read_index(self.index_name(dataset)) - - index_ivf, vec_transform = unwind_index_ivf(index) - if vec_transform is None: - vec_transform = lambda x: x - if index_ivf is not None: - print("imbalance_factor=", index_ivf.invlists.imbalance_factor()) - - no_precomputed_tables = index_params.get("no_precomputed_tables", True) - if no_precomputed_tables: - if isinstance(index_ivf, faiss.IndexIVFPQ): - print("disabling precomputed table") - index_ivf.use_precomputed_table = -1 - index_ivf.precomputed_table.clear() - - precomputed_table_size = 0 - if hasattr(index_ivf, 'precomputed_table'): - precomputed_table_size = index_ivf.precomputed_table.size() * 4 - print("precomputed tables size:", precomputed_table_size) - - # prep for the searches - - searchthreads = index_params.get("searchthreads", -1) - if searchthreads == -1: - print("Search threads:", faiss.omp_get_max_threads()) - else: - print("Setting nb of threads to", searchthreads) - faiss.omp_set_num_threads(searchthreads) - - parallel_mode = index_params.get("parallel_mode", 3) - if parallel_mode != -1: - print("setting IVF parallel mode to", parallel_mode) - index_ivf.parallel_mode - index_ivf.parallel_mode = parallel_mode 
- - self.ps = faiss.ParameterSpace() - self.ps.initialize(index) - - search_bs = index_params.get("search_bs", 8092) - index_wrap = IndexQuantizerOnGPU(index, search_bs) - - self.cpuindex = index - self.index = index_wrap - - return True - - def set_query_arguments(self, query_args): - faiss.cvar.indexIVF_stats.reset() - self.ps.set_index_parameters(self.cpuindex, query_args) - self.qas = query_args - - - # shall we return something interesting here? - def get_additional(self): - return {"dist_comps": faiss.cvar.indexIVF_stats.ndis} - - def __str__(self): - return f'FaissIVFPQ({self.qas})' - - def query(self, X, n): - self.res = self.index.search(X, n) - - def range_query(self, X, radius): - self.res = self.index.range_search(X, radius) - - def get_results(self): - D, I = self.res - return I - - def get_range_results(self): - return self.res diff --git a/benchmark/algorithms/gemini.py b/benchmark/algorithms/gemini.py deleted file mode 100644 index ea261fd95..000000000 --- a/benchmark/algorithms/gemini.py +++ /dev/null @@ -1,279 +0,0 @@ -from __future__ import absolute_import -import numpy as np -import sklearn.preprocessing -import ctypes -import faiss -import os -import time -import ast -from tqdm import tqdm - -from benchmark.algorithms.base import BaseANN -from benchmark.datasets import DATASETS, download_accelerated - -# GSL stuff -import gdl_bindings as gdl -import gsl_bindings as gsl -from tmp_api import * -import gsl_utils -import gsld_bindings_rerank as gsld_rerank - -def convert_index_to_cluster_and_ids_lists(index, nbits): - cluster_list = np.empty(index.invlists.nlist, dtype=object) - ids_list = np.empty(index.invlists.nlist, dtype=object) - - zero_count = 0 - - for i in range(index.invlists.nlist): - list_sz = index.invlists.list_size(i) - - if list_sz == 0: - zero_count = zero_count + 1 - ids = None - else: - ids_ptr = index.invlists.get_ids(i) - ids = np.array(faiss.rev_swig_ptr(ids_ptr, list_sz)).reshape(-1, 1).astype(np.uint32) # GSL requires a 2d 
arrray for some reason - index.invlists.release_ids(ids_ptr) - # index.invlists.release_ids(list_sz, ids_ptr) - ids_list[i] = ids - - codes_ptr = index.invlists.get_codes(i) - codes = np.array(faiss.rev_swig_ptr(codes_ptr, list_sz * nbits // 8)).reshape(list_sz, nbits//8) - index.invlists.release_codes(codes_ptr) - # index.invlists.release_codes(list_sz * nbits // 8, codes_ptr) - cluster_list[i] = codes - - print('zero_count =', zero_count) - return cluster_list, ids_list - -def get_cluster_and_ids_lists(index, nbits): - print('Creating cluster + ids lists...') - ret = convert_index_to_cluster_and_ids_lists(index, nbits) - return ret - -def create_encoding(encoding_file_name, normalize=False): - print("FILE LOAD PATH", encoding_file_name) - single_np_array = np.load(encoding_file_name) - # contains 6 arrays in a particular order - layers = [NHEncoding.NHLayer(single_np_array[0], single_np_array[1].reshape(1, len(single_np_array[1]))), - NHEncoding.NHLayer(single_np_array[2], single_np_array[3].reshape(1, len(single_np_array[3]))), - NHEncoding.NHLayer(single_np_array[4], single_np_array[5].reshape(1, len(single_np_array[5])))] - [ print(l.shape) for l in single_np_array ] - return NHEncoding(layers, normalize) - -class GeminiT3(BaseANN): - def __init__(self, metric, index_params): - # GSL init - s = gdl.gdl_init() - if s: - raise Exception('gdl.gdl_init() failed with {}'.format(s)) - s, n_gdl_ctxs = gdl.gdl_context_count_get() - if s: - raise Exception('gdl.gdl_context_count_get() failed with {}'.format(s)) - - s, gdl_desc_list = gdl.gdl_context_desc_get(n_gdl_ctxs) - if s: - raise Exception('gdl.gdl_context_desc_get() failed with {}'.format(s)) - - gdl_ctx_ids = [desc.ctx_id for desc in gdl_desc_list if desc.status == gdl.GDL_CONTEXT_READY] - if not gdl_ctx_ids: - raise Exception("No valid context found") - - self._index_params = index_params - self._metric = metric - self.index_params = ast.literal_eval(index_params) - num_apuc = self.index_params['num_apuc'] - 
print("NUM_APUC", num_apuc) - self.gsl_ctx = Context(gdl_ctx_ids[:num_apuc], max_num_threads=56) - # GSL init end - - self.max_num_queries = 10000 - self.num_records = 1000000000 - - print(f'GSI GeminiT3(BaseANN){self.index_params}') - - def index_name(self, name): - nlist = self.index_params['nlist'] - qbits = self.index_params['qbits'] - nbits = self.index_params['nbits'] - nt = self.index_params['nt'] - is_f16 = self.index_params['f16'] - key = "nbits=%d,qbits=%d,nlist=%d,nt=%d,f16=%s" % (nbits, qbits, nlist, nt, str(is_f16)) - return f"data/{name}.{key}.geminiindex" - - def fit(self, dataset): - assert 0 - - def load_index(self, dataset): - - nlist = self.index_params['nlist'] - qbits = self.index_params['qbits'] - nbits = self.index_params['nbits'] - nt = self.index_params['nt'] - is_f16 = self.index_params['f16'] - - # number of centroids maps to an index subdir - centroids_dirs = { 524288: 'centroids_512k/', 2097152: 'centroids_2m/', 4194304: 'centroids_4m/'} - num_centroids_dir = centroids_dirs[nlist] - - # the index name is the parent folder of the index component files - prefix = self.index_name( dataset ) - - resources_path = '' - case_dir = '1b/' - resources_path_case = f'{resources_path}{case_dir}' - - fp_quantizer_file_name = f'{prefix}/{resources_path}{num_centroids_dir}Deep1B.nt{nt}.nlist{nlist}.quantizer' - records_encoding_file_name = f'{prefix}/{resources_path}records_weights/records_weights.bits{nbits}.npy' - centroids_encoding_file_name = f'{prefix}/{resources_path}{num_centroids_dir}centroids_weights.nt{nt}.nlist{nlist}.nbits{nbits}.npy' - index_file_name = f'{prefix}/{resources_path_case}Deep1B.ivfbinnh.nt{nt}.nlist{nlist}.nb{self.num_records}.bits{qbits}.index' - db_path = f'{prefix}/{resources_path_case}fdb.npy' - - print('********************** Paths ***************************') - print('fp_quantizer_file_name =', fp_quantizer_file_name) - if not os.path.isfile(fp_quantizer_file_name): - raise FileNotFoundError(fp_quantizer_file_name) - 
print('records_encoding_file_name =', records_encoding_file_name) - if not os.path.isfile(records_encoding_file_name): - raise FileNotFoundError(records_encoding_file_name) - print('centroids_encoding_file_name =', centroids_encoding_file_name) - if not os.path.isfile(centroids_encoding_file_name): - raise FileNotFoundError(centroids_encoding_file_name) - print('index_file_name =', index_file_name) - if not os.path.isfile(index_file_name): - raise FileNotFoundError(index_file_name) - print('db_path =', db_path) - if not os.path.isfile(db_path): - raise FileNotFoundError(db_path) - print('********************************************************') - - self.centroids_encoding = create_encoding(centroids_encoding_file_name, False) - print("centroids", centroids_encoding_file_name, self.centroids_encoding) - self.records_encoding = create_encoding(records_encoding_file_name, False) - print("records", records_encoding_file_name, self.records_encoding) - - print('load XF deep-1B') - num_features = 96 - dtype = gsld_rerank.GSLD_RERANK_DATA_TYPE_FLOAT - - print('init rerank...') - self.rerank = gsld_rerank.init(self.num_records, num_features, num_features * 4, dtype, gsld_rerank.GSLD_RERANK_ALGO_L2, is_f16, db_path) - print('finished init rerank') - - print(f'GSI loading index:{index_file_name}') - self.index = faiss.read_index_binary(index_file_name) - - # cluster_list, ids_list = get_cluster_and_ids_lists(self.index, nbits) - cluster_list, ids_list = get_cluster_and_ids_lists(self.index, qbits) - - print('creating GSL cluster binary DB...') - self.clstr_bdb = self.gsl_ctx.create_cluster_bdb(cluster_list, ids_list) - del cluster_list - del ids_list - - quantizer = faiss.downcast_IndexBinary(self.index.quantizer) - centroids = faiss.vector_to_array(quantizer.xb) - centroids = np.reshape(centroids, (quantizer.ntotal, quantizer.d//8)) - self.centroids_bdb = self.gsl_ctx.create_bdb(centroids) - del centroids - - l2_quantizer = faiss.read_index(fp_quantizer_file_name) - 
l2_centroids = faiss.vector_float_to_array(l2_quantizer.xb) - l2_centroids = np.reshape(l2_centroids, (nlist, l2_quantizer.d)) - print('centroids (float):', l2_centroids.shape, l2_centroids.dtype) - print('creating GSL centroids float DB...') - self.centroids_fdb = self.gsl_ctx.create_fdb(l2_centroids, False) - - self.centroids_encoding = create_encoding(centroids_encoding_file_name, False) - print("centroids", centroids_encoding_file_name, self.centroids_encoding) - self.records_encoding = create_encoding(records_encoding_file_name, False) - print("records", records_encoding_file_name, self.records_encoding) - - return True - - def set_query_arguments(self, query_args): - - #destroy previous runs' seesion - try: - print('destroying search session') - self.session_hdl.destroy() - except AttributeError: - print('no session to destroy') - - typical_num_queries = self.max_num_queries - - self.search_params = ast.literal_eval(query_args) - nprobe = self.search_params['nprobe'] - nprobe_refine = self.search_params['nprobe_refine'] - hamming_k = self.search_params['hamming_k'] - average_clstr_size_factor = self.search_params['average_clstr_size_factor'] - - print('--->', 'nprobe =', nprobe, 'nprobe_refine =', nprobe_refine, 'hamming_k =', hamming_k, - 'average_clstr_size_factor =', average_clstr_size_factor) - - rerank_desc = RerankDesc(self.centroids_fdb, nprobe_refine, gsl.GSL_ALG_KNN_L2_FDB) - - desc = ClusterHammingDesc(self.max_num_queries, - typical_num_queries, - self.centroids_bdb, - nprobe, - hamming_k, - rerank_desc, - self.centroids_encoding, - self.records_encoding, - self.clstr_bdb, - average_clstr_size_factor) - - self.session_hdl = self.gsl_ctx.create_session(desc) - print('Created GSL session') - self.gsl_ctx.search_in_focus(self.session_hdl) - print('Set GSL session in focus') - - def get_additional(self): - return {"dist_comps": faiss.cvar.indexIVF_stats.ndis} - - def __str__(self): - return f'GSI:{self.index_params} {self.search_params}' - - def 
query(self, X, n): - - print('Performing search on GSL') - out_shape = (X.shape[0], self.search_params['hamming_k']) - outputs = ClusterFlatOutputs(np.empty(out_shape, dtype=np.uint32), np.empty(out_shape, dtype=np.float32)) - out_indices, out_distances = self.gsl_ctx.search(ClusterInputs(X), outputs) - print('Finished search on GSL') - - print('run rerank...') - start = time.time() - res_idx, res_val = gsld_rerank.rerank(self.rerank, X, out_indices, n, 56) - end = time.time() - print('rerank time(milisec): ', (end - start) * 1000) - self.res = out_distances.astype(np.int32), res_idx.astype(np.int64) - - def range_query(self, X, radius): - print('in range query <-----') - - def get_results(self): - print('in get_results <-----') - D, I = self.res - return I - - def get_range_results(self): - print('in get_range_results <-----') - return self.res - - def __del__(self): - print('exit rerank...') - gsld_rerank.exit(self.rerank) - print('destroying search session') - self.session_hdl.destroy() - print('destroying centroids float DB') - self.centroids_fdb.destroy() - print('destroying centroids binary DB') - self.centroids_bdb.destroy() - print('destroying cluster binary DB') - self.clstr_bdb.destroy() - del self.gsl_ctx - s = gdl.gdl_exit() - if s: - raise Exception('gdl.gdl_exit failed with {}'.format(s)) diff --git a/benchmark/algorithms/httpann.py b/benchmark/algorithms/httpann.py deleted file mode 100644 index 36cbccfb5..000000000 --- a/benchmark/algorithms/httpann.py +++ /dev/null @@ -1,125 +0,0 @@ -import shlex -import sys -import time -from subprocess import Popen -from threading import Thread - -import numpy as np -import requests - -from benchmark.algorithms.base import BaseANN - - -class HttpANN(BaseANN): - """ - HTTP-based ANN algorithm. - Designed to enable language-agnostic ANN by delegating indexing and querying to a separate HTTP server. - - The HTTP server must satisfy the following API. 
- - | Method | Route | Request Body | Expected Status | Response Body | - | ------ | -------------------- | ---------------------------------------------------------------------------------------------------------- | --------------- | -------------------------------------------------------------------------- | - | POST | /init | dictionary of constructor arguments, e.g., {"metric": "euclidean", "dimension": 99 } | 200 | { } | - | POST | /load_index | { "dataset": } | 200 | { "load_index": } | - | POST | /fit | { "dataset": } | 200 | { } | - | POST | /set_query_arguments | dictionary of query arguments | 200 | { } | - | POST | /query | { "X": , "k": } | 200 | { } | - | POST | /range_query | { "X": , “radius”: } | 200 | { } | - | POST | /get_results | { } | 200 | { "get_results": } | - | POST | /get_additional | { } | 200 | { "get_additional": } | - | POST | /get_range_results | { } | 200 | { "get_range_results": } | - - Note that this is a 1:1 copy of the BaseANN Python Class API implemented as remote procedure calls. - """ - - def __init__(self, server_url: str, start_seconds: int, name: str, **kwargs): - """ - Base constructor for an HttpANN algorithm. - @param server_url: base URL for the server including port, e.g., "http:localhost:8080" - @param start_seconds: how many seconds to wait for the server to start before posting to the /init endpoint. - @param name: algorithm name - @param kwargs: any additional keyword arguments that will be passed through to the /init endpoint. - """ - self.server_url = server_url - self.name = name - - # Used by get_results method, defined in query method. - self.res = [] - - # Let the server start and post to init. 
- time.sleep(start_seconds) - self.post("init", kwargs, 200) - - def post(self, path: str, body: dict, expected_status: int) -> dict: - url = f"{self.server_url}/{path}" - res = requests.post(url, json=body) - if res.status_code != expected_status: - raise HttpANNResponseError(url, expected_status, res.status_code) - return res.json() - - def fit(self, dataset): - body = dict(dataset=dataset) - self.post("fit", body, 200) - - def load_index(self, dataset): - body = dict(dataset=dataset) - json = self.post("load_index", body, 200) - return json["load_index"] - - def query(self, X, k): - body = dict(X=[arr.tolist() for arr in X], k=k) - self.post("query", body, 200) - - def range_query(self, X, radius): - body = dict(X=[arr.tolist() for arr in X], radius=radius) - self.post("range_query", body, 200) - - def get_results(self): - json = self.post("get_results", dict(), 200) - return np.array(json["get_results"]) - - def get_range_results(self): - json = self.post("get_range_results", dict(), 200) - [lims, I, D] = json["get_range_results"] - return np.array(lims, 'int32'), np.array(I, 'int32'), np.array(D, 'float32') - - def get_additional(self): - json = self.post("get_additional", dict(), 200) - return json["get_additional"] - - def set_query_arguments(self, *query_args): - body = dict(query_args=query_args) - self.post("set_query_arguments", body, 200) - - -class HttpANNError(RuntimeError): - """Custom error type""" - pass - - -class HttpANNResponseError(HttpANNError): - """Custom error type""" - - def __init__(self, endpoint: str, expected_status: int, actual_status: int): - super(HttpANNError, self).__init__(f"Endpoint {endpoint} expected {expected_status} but got {actual_status}") - - -class HttpANNSubprocess(object): - """ - Helper class to start the HTTP server as a local subprocess. - Starts a background thread to monitor the subprocess by checking for an exit code once per second. - If the background thread finds an exit code, it will raise an HttpANNError. 
- """ - - def __init__(self, server_subprocess_command: str): - proc = Popen(shlex.split(server_subprocess_command), stdout=sys.stdout, stderr=sys.stderr) - - def monitor(): - while True: - time.sleep(1) - poll = proc.poll() - if poll is not None: - raise HttpANNError(f"HTTP server subprocess prematurely returned status code {poll}.") - - t = Thread(target=monitor, args=(), daemon=True) - t.start() diff --git a/benchmark/algorithms/httpann_example.py b/benchmark/algorithms/httpann_example.py deleted file mode 100644 index a6b876be0..000000000 --- a/benchmark/algorithms/httpann_example.py +++ /dev/null @@ -1,154 +0,0 @@ -import numpy as np -from flask import Flask, request, jsonify -from sklearn.neighbors import NearestNeighbors - -from benchmark.datasets import DATASETS -from .httpann import HttpANN, HttpANNSubprocess - - -class HttpANNExampleAlgorithm(HttpANN, HttpANNSubprocess): - """ - ANN algorithm that serves as a standard "algorithm" (callable from runner.py) and manages an HTTP server that - implements the actual indexing and query processing algorithms. - - By implementing HttpANNSubprocess, it starts a local server (which is implemented further below in the same file). - By implementing HttpANN, it can be used by runner.py to make ANN requests from Python to the local server. - - Obviously this is a contrived setup, as the actual algorithm is also implemented in Python. - It's purely as an example of how one might run an algorithm from another language by using an HTTP server to - implement the server API expected by HttpANN. 
- """ - - def __init__(self, metric: str, dimension: int, use_dims: float): - HttpANNSubprocess.__init__(self, "python3 -m benchmark.algorithms.httpann_example example") - HttpANN.__init__(self, server_url="http://localhost:8080", start_seconds=3, - name=f"http-ann-example-{metric}-{use_dims}", metric=metric, dimension=dimension, - use_dims=use_dims) - - -# Starts a local flask server that adheres to the HttpANN API and delegates the work to a local ANN algorithm. -def main(): - class SimpleANNAlgo(object): - """ - Very simple ANN algorithm intended only to demonstrate the HttpANN functionality. - This algorithm is instantiated and called from the example server below. - The algorithm is approximate in the sense that it uses exact KNN constrained to a configurable subset of the - highest variance dimensions. For example, if dimensions=100 and use_dims=0.22, the algorithm picks the 22 - dimensions with the highest variance and use them for exact KNN. - """ - - def __init__(self, metric: str, dimension: int, use_dims: float = 0.1): - self.metric = metric - self.dimension = dimension - self.use_dims = use_dims - self.knn = None - self.high_variance_dims = None - self.res = None - - def fit(self, dataset): - ds = DATASETS[dataset]() - arr = ds.get_dataset() - var = arr.var(axis=0) - num_dims = int(self.use_dims * arr.shape[1]) - self.high_variance_dims = np.argsort(var)[-num_dims:] - self.knn = NearestNeighbors(algorithm='brute', metric=self.metric) - self.knn.fit(arr[:, self.high_variance_dims]) - - def load_index(self, dataset): - # Always returns false because the index is not stored. 
- return False - - def query(self, X, k): - self.res = self.knn.kneighbors(X[:, self.high_variance_dims], n_neighbors=k, return_distance=False) - - def range_query(self, X, radius): - nbrs, dsts = self.knn.radius_neighbors(X[:, self.high_variance_dims], radius=radius, return_distance=True) - total = sum(map(len, nbrs)) - lims = np.zeros(len(X) + 1, 'int32') - I = np.zeros(total, 'int32') - D = np.zeros(total, 'float32') - for i in range(len(X)): - lims[i + 1] = lims[i] + len(nbrs[i]) - I[lims[i]:lims[i + 1]] = nbrs[i] - D[lims[i]:lims[i + 1]] = dsts[i] - self.res = (lims, I, D) - - def get_results(self): - return self.res - - def get_range_results(self): - return self.res - - def get_additional(self): - return {} - - app = Flask(__name__) - - # Algorithm is instantiated later but needs to be attached to an object. - app.algo = None - - @app.route("/status", methods=['GET']) - def status(): - return jsonify(dict()), 200 - - @app.route("/init", methods=['POST']) - def init(): - app.algo = SimpleANNAlgo(**request.json) - return jsonify(dict()), 200 - - @app.route("/load_index", methods=['POST']) - def load_index(): - b = app.algo.load_index(**request.json) - return jsonify(dict(load_index=b)), 200 - - @app.route("/fit", methods=['POST']) - def fit(): - app.algo.fit(**request.json) - return jsonify(dict()), 200 - - @app.route("/set_query_arguments", methods=['POST']) - def set_query_arguments(): - app.algo.set_query_arguments(**request.json) - return jsonify(dict()), 200 - - @app.route("/query", methods=['POST']) - def query(): - j = request.json - app.algo.query(np.array(j['X']), j['k']) - return jsonify(dict()), 200 - - @app.route("/range_query", methods=['POST']) - def range_query(): - j = request.json - app.algo.range_query(np.array(j['X']), j['radius']) - return jsonify(dict()), 200 - - @app.route("/get_results", methods=['POST']) - def get_results(): - neighbors = [arr.tolist() for arr in app.algo.res] - return jsonify(dict(get_results=neighbors)), 200 - - 
@app.route("/get_range_results", methods=['POST']) - def get_range_results(): - lims, I, D = app.algo.get_range_results() - res = [ - lims.tolist(), - [arr.tolist() for arr in I], - [arr.tolist() for arr in D] - ] - return jsonify(dict(get_range_results=res)), 200 - - @app.route("/get_additional", methods=['POST']) - def get_additional(): - return jsonify(dict(get_additional=app.algo.get_additional())), 200 - - app.run('0.0.0.0', 8080, debug=False) - # We could also use gevent/wsgi for a more professional setup. - # https://flask.palletsprojects.com/en/2.0.x/deploying/wsgi-standalone/#gevent - # from gevent.pywsgi import WSGIServer - # http_server = WSGIServer(('0.0.0.0', 8080), app) - # http_server.serve_forever() - - -if __name__ == "__main__": - main() diff --git a/benchmark/datasets.py b/benchmark/datasets.py deleted file mode 100644 index 368e646b2..000000000 --- a/benchmark/datasets.py +++ /dev/null @@ -1,737 +0,0 @@ -import math -import numpy -import os -import random -import sys -import struct -import time - -import numpy as np - -from urllib.request import urlopen -from urllib.request import urlretrieve - -BASEDIR = "data/" - -def download(src, dst=None, max_size=None): - """ download an URL, possibly cropped """ - if os.path.exists(dst): - return - print('downloading %s -> %s...' 
% (src, dst)) - if max_size is not None: - print(" stopping at %d bytes" % max_size) - t0 = time.time() - outf = open(dst, "wb") - inf = urlopen(src) - info = dict(inf.info()) - content_size = int(info['Content-Length']) - bs = 1 << 20 - totsz = 0 - while True: - block = inf.read(bs) - elapsed = time.time() - t0 - print( - " [%.2f s] downloaded %.2f MiB / %.2f MiB at %.2f MiB/s " % ( - elapsed, - totsz / 2**20, content_size / 2**20, - totsz / 2**20 / elapsed), - flush=True, end="\r" - ) - if not block: - break - if max_size is not None and totsz + len(block) >= max_size: - block = block[:max_size - totsz] - outf.write(block) - totsz += len(block) - break - outf.write(block) - totsz += len(block) - print() - print("download finished in %.2f s, total size %d bytes" % ( - time.time() - t0, totsz - )) - - -def download_accelerated(src, dst, quiet=False, sas_string=""): - """ dowload using an accelerator. Make sure the executable is in the path """ - print('downloading %s -> %s...' % (src, dst)) - if "windows.net" in src: - if sas_string == "": - cmd = f"azcopy copy {src} {dst}" - else: - cmd = f"azcopy copy '{src}?{sas_string}' '{dst}'" - else: - cmd = f"axel --alternate -n 10 {src} -o {dst}" - if quiet: - cmd += " -q" - - print("running", cmd) - ret = os.system(cmd) - assert ret == 0 - -def upload_accelerated(local_dir, blob_prefix, component, sas_string, quiet=False): - """ Upload index component to Azure blob using SAS string""" - src = os.path.join(local_dir, component) - dst = blob_prefix + '/' + component + '?' + sas_string - print('Uploading %s -> %s...' 
% (src, dst)) - - cmd = f"azcopy copy '{src}' '{dst}'" - print("running", cmd) - ret = os.system(cmd) - assert ret == 0 - - -def bvecs_mmap(fname): - x = numpy.memmap(fname, dtype='uint8', mode='r') - d = x[:4].view('int32')[0] - return x.reshape(-1, d + 4)[:, 4:] - -def ivecs_read(fname): - a = numpy.fromfile(fname, dtype='int32') - d = a[0] - return a.reshape(-1, d + 1)[:, 1:].copy() - -def xbin_mmap(fname, dtype, maxn=-1): - """ mmap the competition file format for a given type of items """ - n, d = map(int, np.fromfile(fname, dtype="uint32", count=2)) - - # HACK - to handle improper header in file for private deep-1B - # if override_d and override_d != d: - # print("Warning: xbin_mmap map returned d=%s, but overridig with %d" % (d, override_d)) - # d = override_d - # HACK - - assert os.stat(fname).st_size == 8 + n * d * np.dtype(dtype).itemsize - if maxn > 0: - n = min(n, maxn) - return np.memmap(fname, dtype=dtype, mode="r", offset=8, shape=(n, d)) - -def range_result_read(fname): - """ read the range search result file format """ - f = open(fname, "rb") - nq, total_res = np.fromfile(f, count=2, dtype="int32") - nres = np.fromfile(f, count=nq, dtype="int32") - assert nres.sum() == total_res - I = np.fromfile(f, count=total_res, dtype="int32") - D = np.fromfile(f, count=total_res, dtype="float32") - return nres, I, D - -def knn_result_read(fname): - n, d = map(int, np.fromfile(fname, dtype="uint32", count=2)) - assert os.stat(fname).st_size == 8 + n * d * (4 + 4) - f = open(fname, "rb") - f.seek(4+4) - I = np.fromfile(f, dtype="int32", count=n * d).reshape(n, d) - D = np.fromfile(f, dtype="float32", count=n * d).reshape(n, d) - return I, D - -def read_fbin(filename, start_idx=0, chunk_size=None): - """ Read *.fbin file that contains float32 vectors - Args: - :param filename (str): path to *.fbin file - :param start_idx (int): start reading vectors from this index - :param chunk_size (int): number of vectors to read. 
- If None, read all vectors - Returns: - Array of float32 vectors (numpy.ndarray) - """ - with open(filename, "rb") as f: - nvecs, dim = np.fromfile(f, count=2, dtype=np.int32) - nvecs = (nvecs - start_idx) if chunk_size is None else chunk_size - arr = np.fromfile(f, count=nvecs * dim, dtype=np.float32, - offset=start_idx * 4 * dim) - return arr.reshape(nvecs, dim) - - -def read_ibin(filename, start_idx=0, chunk_size=None): - """ Read *.ibin file that contains int32 vectors - Args: - :param filename (str): path to *.ibin file - :param start_idx (int): start reading vectors from this index - :param chunk_size (int): number of vectors to read. - If None, read all vectors - Returns: - Array of int32 vectors (numpy.ndarray) - """ - with open(filename, "rb") as f: - nvecs, dim = np.fromfile(f, count=2, dtype=np.int32) - nvecs = (nvecs - start_idx) if chunk_size is None else chunk_size - arr = np.fromfile(f, count=nvecs * dim, dtype=np.int32, - offset=start_idx * 4 * dim) - return arr.reshape(nvecs, dim) - - -def sanitize(x): - return numpy.ascontiguousarray(x, dtype='float32') - - -class Dataset(): - def prepare(self): - """ - Download and prepare dataset, queries, groundtruth. - """ - pass - def get_dataset_fn(self): - """ - Return filename of dataset file. - """ - pass - def get_dataset(self): - """ - Return memmapped version of the dataset. - """ - pass - def get_dataset_iterator(self, bs=512, split=(1, 0)): - """ - Return iterator over blocks of dataset of size at most 512. - The split argument takes a pair of integers (n, p) where p = 0..n-1 - The dataset is split in n shards, and the iterator returns only shard #p - This makes it possible to process the dataset independently from several - processes / threads. - """ - pass - def get_queries(self): - """ - Return (nq, d) array containing the nq queries. - """ - pass - def get_private_queries(self): - """ - Return (private_nq, d) array containing the private_nq private queries. 
- """ - pass - def get_groundtruth(self, k=None): - """ - Return (nq, k) array containing groundtruth indices - for each query.""" - pass - - def search_type(self): - """ - "knn" or "range" - """ - pass - - def distance(self): - """ - "euclidean" or "ip" or "angular" - """ - pass - - def default_count(self): - return 10 - - def short_name(self): - return f"{self.__class__.__name__}-{self.nb}" - - def __str__(self): - return ( - f"Dataset {self.__class__.__name__} in dimension {self.d}, with distance {self.distance()}, " - f"search_type {self.search_type()}, size: Q {self.nq} B {self.nb}") - - -############################################################################# -# Datasets for the competition -############################################################################## - - - -class DatasetCompetitionFormat(Dataset): - """ - Dataset in the native competition format, that is able to read the - files in the https://big-ann-benchmarks.com/ page. - The constructor should set all fields. The functions below are generic. - - For the 10M versions of the dataset, the database files are downloaded in - part and stored with a specific suffix. This is to avoid having to maintain - two versions of the file. - """ - - def prepare(self, skip_data=False): - if not os.path.exists(self.basedir): - os.makedirs(self.basedir) - - # start with the small ones... 
- for fn in [self.qs_fn, self.gt_fn]: - if fn is None: - continue - if fn.startswith("https://"): - sourceurl = fn - outfile = os.path.join(self.basedir, fn.split("/")[-1]) - else: - sourceurl = os.path.join(self.base_url, fn) - outfile = os.path.join(self.basedir, fn) - if os.path.exists(outfile): - print("file %s already exists" % outfile) - continue - download(sourceurl, outfile) - - # private qs url - if self.private_qs_url: - outfile = os.path.join(self.basedir, self.private_qs_url.split("/")[-1]) - if os.path.exists(outfile): - print("file %s already exists" % outfile) - else: - download(self.private_qs_url, outfile) - - # private gt url - if self.private_gt_url: - outfile = os.path.join(self.basedir, self.private_gt_url.split("/")[-1]) - if os.path.exists(outfile): - print("file %s already exists" % outfile) - else: - download(self.private_gt_url, outfile) - - if skip_data: - return - - fn = self.ds_fn - sourceurl = os.path.join(self.base_url, fn) - outfile = os.path.join(self.basedir, fn) - if os.path.exists(outfile): - print("file %s already exists" % outfile) - return - if self.nb == 10**9: - download_accelerated(sourceurl, outfile) - else: - # download cropped version of file - file_size = 8 + self.d * self.nb * np.dtype(self.dtype).itemsize - outfile = outfile + '.crop_nb_%d' % self.nb - if os.path.exists(outfile): - print("file %s already exists" % outfile) - return - download(sourceurl, outfile, max_size=file_size) - # then overwrite the header... 
- header = np.memmap(outfile, shape=2, dtype='uint32', mode="r+") - assert header[0] == 10**9 - assert header[1] == self.d - header[0] = self.nb - - def get_dataset_fn(self): - fn = os.path.join(self.basedir, self.ds_fn) - if os.path.exists(fn): - return fn - if self.nb != 10**9: - fn += '.crop_nb_%d' % self.nb - return fn - else: - raise RuntimeError("file not found") - - def get_dataset_iterator(self, bs=512, split=(1,0)): - nsplit, rank = split - i0, i1 = self.nb * rank // nsplit, self.nb * (rank + 1) // nsplit - filename = self.get_dataset_fn() - x = xbin_mmap(filename, dtype=self.dtype, maxn=self.nb) - assert x.shape == (self.nb, self.d) - for j0 in range(i0, i1, bs): - j1 = min(j0 + bs, i1) - yield sanitize(x[j0:j1]) - - def search_type(self): - return "knn" - - def get_groundtruth(self, k=None): - assert self.gt_fn is not None - fn = self.gt_fn.split("/")[-1] # in case it's a URL - assert self.search_type() == "knn" - - I, D = knn_result_read(os.path.join(self.basedir, fn)) - assert I.shape[0] == self.nq - if k is not None: - assert k <= 100 - I = I[:, :k] - D = D[:, :k] - return I, D - - def get_dataset(self): - assert self.nb <= 10**7, "dataset too large, use iterator" - return sanitize(next(self.get_dataset_iterator(bs=self.nb))) - - def get_queries(self): - filename = os.path.join(self.basedir, self.qs_fn) - x = xbin_mmap(filename, dtype=self.dtype) - assert x.shape == (self.nq, self.d) - return sanitize(x) - - def get_private_queries(self): - assert self.private_qs_url is not None - fn = self.private_qs_url.split("/")[-1] # in case it's a URL - filename = os.path.join(self.basedir, fn) - x = xbin_mmap(filename, dtype=self.dtype) - assert x.shape == (self.private_nq, self.d) - return sanitize(x) - - def get_private_groundtruth(self, k=None): - assert self.private_gt_url is not None - fn = self.private_gt_url.split("/")[-1] # in case it's a URL - assert self.search_type() == "knn" - - I, D = knn_result_read(os.path.join(self.basedir, fn)) - assert 
I.shape[0] == self.private_nq - if k is not None: - assert k <= 100 - I = I[:, :k] - D = D[:, :k] - return I, D - -subset_url = "https://dl.fbaipublicfiles.com/billion-scale-ann-benchmarks/" - -class SSNPPDataset(DatasetCompetitionFormat): - def __init__(self, nb_M=1000): - # assert nb_M in (10, 1000) - self.nb_M = nb_M - self.nb = 10**6 * nb_M - self.d = 256 - self.nq = 100000 - self.dtype = "uint8" - self.ds_fn = "FB_ssnpp_database.u8bin" - self.qs_fn = "FB_ssnpp_public_queries.u8bin" - self.gt_fn = ( - "FB_ssnpp_public_queries_1B_GT.rangeres" if self.nb_M == 1000 else - subset_url + "GT_100M/ssnpp-100M" if self.nb_M == 100 else - subset_url + "GT_10M/ssnpp-10M" if self.nb_M == 10 else - None - ) - - self.base_url = "https://dl.fbaipublicfiles.com/billion-scale-ann-benchmarks/" - self.basedir = os.path.join(BASEDIR, "FB_ssnpp") - - self.private_nq = 100000 - self.private_qs_url = "https://dl.fbaipublicfiles.com/billion-scale-ann-benchmarks/FB_ssnpp_heldout_queries_3307fba121460a56.u8bin" - self.private_gt_url = "https://dl.fbaipublicfiles.com/billion-scale-ann-benchmarks/GT_1B_final_2bf4748c7817/FB_ssnpp.bin" - - def search_type(self): - return "range" - - def default_count(self): - return 96237 - - def distance(self): - return "euclidean" - - def get_groundtruth(self, k=None): - """ override the ground-truth function as this is the only range search dataset """ - assert self.gt_fn is not None - fn = self.gt_fn.split("/")[-1] # in case it's a URL - return range_result_read(os.path.join(self.basedir, fn)) - - def get_private_groundtruth(self, k=None): - """ override the ground-truth function as this is the only range search dataset """ - assert self.private_gt_url is not None - fn = self.private_gt_url.split("/")[-1] # in case it's a URL - return range_result_read(os.path.join(self.basedir, fn)) - -class BigANNDataset(DatasetCompetitionFormat): - def __init__(self, nb_M=1000): - self.nb_M = nb_M - self.nb = 10**6 * nb_M - self.d = 128 - self.nq = 10000 - 
self.dtype = "uint8" - self.ds_fn = "base.1B.u8bin" - self.qs_fn = "query.public.10K.u8bin" - self.gt_fn = ( - "GT.public.1B.ibin" if self.nb_M == 1000 else - subset_url + "GT_100M/bigann-100M" if self.nb_M == 100 else - subset_url + "GT_10M/bigann-10M" if self.nb_M == 10 else - None - ) - # self.gt_fn = "https://comp21storage.blob.core.windows.net/publiccontainer/comp21/bigann/public_query_gt100.bin" if self.nb == 10**9 else None - self.base_url = "https://dl.fbaipublicfiles.com/billion-scale-ann-benchmarks/bigann/" - self.basedir = os.path.join(BASEDIR, "bigann") - - self.private_nq = 10000 - self.private_qs_url = "https://dl.fbaipublicfiles.com/billion-scale-ann-benchmarks/bigann/query.private.799253207.10K.u8bin" - self.private_gt_url = "https://dl.fbaipublicfiles.com/billion-scale-ann-benchmarks/GT_1B_final_2bf4748c7817/bigann-1B.bin" - - - def distance(self): - return "euclidean" - -class Deep1BDataset(DatasetCompetitionFormat): - def __init__(self, nb_M=1000): - self.nb_M = nb_M - self.nb = 10**6 * nb_M - self.d = 96 - self.nq = 10000 - self.dtype = "float32" - self.ds_fn = "base.1B.fbin" - self.qs_fn = "query.public.10K.fbin" - self.gt_fn = ( - "https://storage.yandexcloud.net/yandex-research/ann-datasets/deep_new_groundtruth.public.10K.bin" if self.nb_M == 1000 else - subset_url + "GT_100M/deep-100M" if self.nb_M == 100 else - subset_url + "GT_10M/deep-10M" if self.nb_M == 10 else - None - ) - self.base_url = "https://storage.yandexcloud.net/yandex-research/ann-datasets/DEEP/" - self.basedir = os.path.join(BASEDIR, "deep1b") - - self.private_nq = 30000 - self.private_qs_url = "https://comp21storage.blob.core.windows.net/publiccontainer/comp21/deep1b/query.heldout.30K.fbin" - self.private_gt_url = "https://comp21storage.blob.core.windows.net/publiccontainer/comp21/deep1b/gt100-heldout.30K.fbin" - - self.private_nq_large = 1000000 - self.private_qs_large_url = 
"https://storage.yandexcloud.net/yr-secret-share/ann-datasets-5ac0659e27/DEEP/query.private.1M.fbin" - - def distance(self): - return "euclidean" - - - -class Text2Image1B(DatasetCompetitionFormat): - def __init__(self, nb_M=1000): - self.nb_M = nb_M - self.nb = 10**6 * nb_M - self.d = 200 - self.nq = 100000 - self.dtype = "float32" - self.ds_fn = "base.1B.fbin" - self.qs_fn = "query.public.100K.fbin" - self.gt_fn = ( - "https://storage.yandexcloud.net/yandex-research/ann-datasets/t2i_new_groundtruth.public.100K.bin" if self.nb_M == 1000 else - subset_url + "GT_100M/text2image-100M" if self.nb_M == 100 else - subset_url + "GT_10M/text2image-10M" if self.nb_M == 10 else - None - ) - self.base_url = "https://storage.yandexcloud.net/yandex-research/ann-datasets/T2I/" - self.basedir = os.path.join(BASEDIR, "text2image1B") - - self.private_nq = 30000 - self.private_qs_url = "https://comp21storage.blob.core.windows.net/publiccontainer/comp21/text2image1b/query.heldout.30K.fbin" - self.private_gt_url = "https://comp21storage.blob.core.windows.net/publiccontainer/comp21/text2image1b/gt100-heldout.30K.fbin" - - self.private_nq_large = 1000000 - self.private_qs_large_url = "https://storage.yandexcloud.net/yr-secret-share/ann-datasets-5ac0659e27/T2I/query.private.1M.fbin" - - def distance(self): - return "ip" - - def get_query_train(self, maxn=10**6): - xq_train = np.memmap( - BASEDIR + "/text2image1B/query.learn.50M.fbin", offset=8, - dtype='float32', shape=(maxn, 200), mode='r') - return np.array(xq_train) - -class MSTuringANNS(DatasetCompetitionFormat): - def __init__(self, nb_M=1000): - self.nb_M = nb_M - self.nb = 10**6 * nb_M - self.d = 100 - self.nq = 100000 - self.dtype = "float32" - self.ds_fn = "base1b.fbin" - self.qs_fn = "query100K.fbin" - self.gt_fn = ( - "query_gt100.bin" if self.nb_M == 1000 else - subset_url + "GT_100M/msturing-100M" if self.nb_M == 100 else - subset_url + "GT_10M/msturing-10M" if self.nb_M == 10 else - None - ) - self.base_url = 
"https://comp21storage.blob.core.windows.net/publiccontainer/comp21/MSFT-TURING-ANNS/" - self.basedir = os.path.join(BASEDIR, "MSTuringANNS") - - self.private_nq = 10000 - self.private_qs_url = "https://comp21storage.blob.core.windows.net/publiccontainer/comp21/MSFT-TURING-ANNS/testQuery10K.fbin" - self.private_gt_url = "https://comp21storage.blob.core.windows.net/publiccontainer/comp21/MSFT-TURING-ANNS/gt100-private10K-queries.bin" - - self.private_nq_large = 99605 - self.private_qs_large_url = "https://comp21storage.blob.core.windows.net/publiccontainer/comp21/MSFT-TURING-ANNS/testQuery99605.fbin" - self.private_gt_large_url = "https://comp21storage.blob.core.windows.net/publiccontainer/comp21/MSFT-TURING-ANNS/gt100-private99605-queries.bin" - - def distance(self): - return "euclidean" - - -class MSSPACEV1B(DatasetCompetitionFormat): - def __init__(self, nb_M=1000): - self.nb_M = nb_M - self.nb = 10**6 * nb_M - self.d = 100 - self.nq = 29316 - self.dtype = "int8" - self.ds_fn = "spacev1b_base.i8bin" - self.qs_fn = "query.i8bin" - self.gt_fn = ( - "public_query_gt100.bin" if self.nb_M == 1000 else - subset_url + "GT_100M/msspacev-100M" if self.nb_M == 100 else - subset_url + "GT_10M/msspacev-10M" if self.nb_M == 10 else - None - ) - self.base_url = "https://comp21storage.blob.core.windows.net/publiccontainer/comp21/spacev1b/" - self.basedir = os.path.join(BASEDIR, "MSSPACEV1B") - - self.private_nq = 30000 - self.private_qs_url = "https://comp21storage.blob.core.windows.net/publiccontainer/comp21/spacev1b/private_query_30k.bin" - self.private_gt_url = "https://comp21storage.blob.core.windows.net/publiccontainer/comp21/spacev1b/gt100_private_query_30k.bin" - - def distance(self): - return "euclidean" - -class RandomRangeDS(DatasetCompetitionFormat): - def __init__(self, nb, nq, d): - self.nb = nb - self.nq = nq - self.d = d - self.dtype = 'float32' - self.ds_fn = f"data_{self.nb}_{self.d}" - self.qs_fn = f"queries_{self.nq}_{self.d}" - self.gt_fn = 
f"gt_{self.nb}_{self.nq}_{self.d}" - self.basedir = os.path.join(BASEDIR, f"random{self.nb}") - if not os.path.exists(self.basedir): - os.makedirs(self.basedir) - - def prepare(self, skip_data=False): - import sklearn.datasets - import sklearn.model_selection - from sklearn.neighbors import NearestNeighbors - - print(f"Preparing datasets with {self.nb} random points and {self.nq} queries.") - - - X, _ = sklearn.datasets.make_blobs( - n_samples=self.nb + self.nq, n_features=self.d, - centers=self.nq, random_state=1) - - data, queries = sklearn.model_selection.train_test_split( - X, test_size=self.nq, random_state=1) - - - with open(os.path.join(self.basedir, self.ds_fn), "wb") as f: - np.array([self.nb, self.d], dtype='uint32').tofile(f) - data.astype('float32').tofile(f) - with open(os.path.join(self.basedir, self.qs_fn), "wb") as f: - np.array([self.nq, self.d], dtype='uint32').tofile(f) - queries.astype('float32').tofile(f) - - print("Computing groundtruth") - - nbrs = NearestNeighbors(n_neighbors=100, metric="euclidean", algorithm='brute').fit(data) - D, I = nbrs.kneighbors(queries) - - nres = np.count_nonzero((D < math.sqrt(self.default_count())) == True, axis=1) - DD = np.zeros(nres.sum()) - II = np.zeros(nres.sum(), dtype='int32') - - s = 0 - for i, l in enumerate(nres): - DD[s : s + l] = D[i, 0 : l] - II[s : s + l] = I[i, 0 : l] - s += l - - with open(os.path.join(self.basedir, self.gt_fn), "wb") as f: - np.array([self.nq, nres.sum()], dtype='uint32').tofile(f) - nres.astype('int32').tofile(f) - II.astype('int32').tofile(f) - DD.astype('float32').tofile(f) - - def get_groundtruth(self, k=None): - """ override the ground-truth function as this is the only range search dataset """ - assert self.gt_fn is not None - fn = self.gt_fn.split("/")[-1] # in case it's a URL - return range_result_read(os.path.join(self.basedir, fn)) - - def search_type(self): - return "range" - - def default_count(self): - return 49 - - def distance(self): - return "euclidean" - - def 
__str__(self): - return f"RandomRange({self.nb})" - -class RandomDS(DatasetCompetitionFormat): - def __init__(self, nb, nq, d): - self.nb = nb - self.nq = nq - self.d = d - self.dtype = 'float32' - self.ds_fn = f"data_{self.nb}_{self.d}" - self.qs_fn = f"queries_{self.nq}_{self.d}" - self.gt_fn = f"gt_{self.nb}_{self.nq}_{self.d}" - self.basedir = os.path.join(BASEDIR, f"random{self.nb}") - if not os.path.exists(self.basedir): - os.makedirs(self.basedir) - - def prepare(self, skip_data=False): - import sklearn.datasets - import sklearn.model_selection - from sklearn.neighbors import NearestNeighbors - - print(f"Preparing datasets with {self.nb} random points and {self.nq} queries.") - - - X, _ = sklearn.datasets.make_blobs( - n_samples=self.nb + self.nq, n_features=self.d, - centers=self.nq, random_state=1) - - data, queries = sklearn.model_selection.train_test_split( - X, test_size=self.nq, random_state=1) - - - with open(os.path.join(self.basedir, self.ds_fn), "wb") as f: - np.array([self.nb, self.d], dtype='uint32').tofile(f) - data.astype('float32').tofile(f) - with open(os.path.join(self.basedir, self.qs_fn), "wb") as f: - np.array([self.nq, self.d], dtype='uint32').tofile(f) - queries.astype('float32').tofile(f) - - print("Computing groundtruth") - - nbrs = NearestNeighbors(n_neighbors=100, metric="euclidean", algorithm='brute').fit(data) - D, I = nbrs.kneighbors(queries) - with open(os.path.join(self.basedir, self.gt_fn), "wb") as f: - np.array([self.nq, 100], dtype='uint32').tofile(f) - I.astype('uint32').tofile(f) - D.astype('float32').tofile(f) - - def search_type(self): - return "knn" - - def distance(self): - return "euclidean" - - def __str__(self): - return f"Random({self.nb})" - - def default_count(self): - return 10 - - -DATASETS = { - 'bigann-1B': lambda : BigANNDataset(1000), - 'bigann-100M': lambda : BigANNDataset(100), - 'bigann-10M': lambda : BigANNDataset(10), - - 'deep-1B': lambda : Deep1BDataset(), - 'deep-100M': lambda : Deep1BDataset(100), 
- 'deep-10M': lambda : Deep1BDataset(10), - - 'ssnpp-1B': lambda : SSNPPDataset(1000), - 'ssnpp-10M': lambda : SSNPPDataset(10), - 'ssnpp-100M': lambda : SSNPPDataset(100), - 'ssnpp-1M': lambda : SSNPPDataset(1), - - 'text2image-1B': lambda : Text2Image1B(), - 'text2image-1M': lambda : Text2Image1B(1), - 'text2image-10M': lambda : Text2Image1B(10), - 'text2image-100M': lambda : Text2Image1B(100), - - 'msturing-1B': lambda : MSTuringANNS(1000), - 'msturing-1M': lambda : MSTuringANNS(1), - 'msturing-10M': lambda : MSTuringANNS(10), - 'msturing-100M': lambda : MSTuringANNS(100), - - 'msspacev-1B': lambda : MSSPACEV1B(1000), - 'msspacev-10M': lambda : MSSPACEV1B(10), - 'msspacev-100M': lambda : MSSPACEV1B(100), - 'msspacev-1M': lambda : MSSPACEV1B(1), - - 'random-xs': lambda : RandomDS(10000, 1000, 20), - 'random-s': lambda : RandomDS(100000, 1000, 50), - - 'random-range-xs': lambda : RandomRangeDS(10000, 1000, 20), - 'random-range-s': lambda : RandomRangeDS(100000, 1000, 50), -} diff --git a/benchmark/distances.py b/benchmark/distances.py deleted file mode 100644 index 7a013697c..000000000 --- a/benchmark/distances.py +++ /dev/null @@ -1,16 +0,0 @@ -from scipy.spatial.distance import pdist as scipy_pdist -import itertools -import numpy as np - -def pdist(a, b, metric): - return scipy_pdist([a, b], metric=metric)[0] - -metrics = { - 'euclidean': { - 'distance': lambda a, b: pdist(a, b, "euclidean"), - }, - 'angular': { - 'distance': lambda a, b: pdist(a, b, "cosine"), - } -} - diff --git a/benchmark/main.py b/benchmark/main.py deleted file mode 100644 index 5f0a63059..000000000 --- a/benchmark/main.py +++ /dev/null @@ -1,250 +0,0 @@ -from __future__ import absolute_import -import argparse -import logging -import logging.config - -import docker -import multiprocessing.pool -import os -import psutil -import random -import shutil -import sys -import traceback - -from benchmark.datasets import DATASETS -from benchmark.algorithms.definitions import (get_definitions, - 
list_algorithms, - algorithm_status, - InstantiationStatus) -from benchmark.results import get_result_filename -from benchmark.runner import run, run_docker, run_no_docker - -from benchmark.sensors.power_capture import power_capture - -def positive_int(s): - i = None - try: - i = int(s) - except ValueError: - pass - if not i or i < 1: - raise argparse.ArgumentTypeError("%r is not a positive integer" % s) - return i - - -def run_worker(args, queue): - print("RW", args) - while not queue.empty(): - definition = queue.get() - memory_margin = 500e6 # reserve some extra memory for misc stuff - mem_limit = int((psutil.virtual_memory().available - memory_margin)) - #mem_limit = 128e9 # 128gb for competition - cpu_limit = "0-%d" % (multiprocessing.cpu_count() - 1) - - if args.nodocker: - run_no_docker(definition, args.dataset, args.count, - args.runs, args.timeout, args.rebuild, cpu_limit, mem_limit, - args.t3, args.power_capture, - args.upload_index, args.download_index, - args.blob_prefix, args.sas_string, - args.private_query) - - else: - run_docker(definition, args.dataset, args.count, - args.runs, args.timeout, args.rebuild, cpu_limit, mem_limit, - args.t3, args.power_capture, - args.upload_index, args.download_index, - args.blob_prefix, args.sas_string, - args.private_query) - - -def main(): - parser = argparse.ArgumentParser( - formatter_class=argparse.ArgumentDefaultsHelpFormatter) - parser.add_argument( - '--dataset', - metavar='NAME', - help='the dataset to load training points from', - default='sift-1M', - choices=DATASETS.keys()) - parser.add_argument( - "-k", "--count", - default=-1, - type=int, - help="the number of near neighbours to search for") - parser.add_argument( - '--definitions', - metavar='FILE', - help='load algorithm definitions from FILE', - default='algos.yaml') - parser.add_argument( - '--algorithm', - metavar='NAME', - help='run only the named algorithm', - default=None) - parser.add_argument( - '--docker-tag', - metavar='NAME', - help='run 
only algorithms in a particular docker image', - default=None) - parser.add_argument( - '--list-algorithms', - help='print the names of all known algorithms and exit', - action='store_true') - parser.add_argument( - '--force', - help='re-run algorithms even if their results already exist', - action='store_true') - parser.add_argument( - '--rebuild', - help='re-build index even if it exists', - action='store_true') - parser.add_argument( - '--runs', - metavar='COUNT', - type=positive_int, - help='run each algorithm instance %(metavar)s times and use only' - ' the best result', - default=5) - parser.add_argument( - '--timeout', - type=int, - help='Timeout (in seconds) for each individual algorithm run, or -1' - 'if no timeout should be set', - default=12 * 3600) - parser.add_argument( - '--max-n-algorithms', - type=int, - help='Max number of algorithms to run (just used for testing)', - default=-1) - parser.add_argument( - '--power-capture', - help='Power capture parameters for the T3 competition. ' - 'Format is "ip:port:capture_time_in seconds" (ie, 127.0.0.1:3000:10).', - default="") - parser.add_argument( - '--t3', - help='Run as a T3 participant.', - action='store_true') - parser.add_argument( - '--nodocker', - help='Override default of invoking algorithm in docker container.', - action='store_true') - parser.add_argument( - '--upload-index', - help='Upload index to Azure blob storage and avoid local queries.', - action='store_true') - parser.add_argument( - '--download-index', - help='Download index uploaded to Azure blob storage and run local queries.', - action='store_true') - parser.add_argument( - '--blob-prefix', - help='Azure blob prefix to upload indices to and download indices from.' - ) - parser.add_argument( - '--sas-string', - help='SAS string to authenticate to Azure blob storage.' 
- ) - parser.add_argument( - '--private-query', - help='Use the new set of private queries that were not released during the competition period.', - action='store_true' - ) - - - args = parser.parse_args() - if args.timeout == -1: - args.timeout = None - - if args.list_algorithms: - list_algorithms(args.definitions) - sys.exit(0) - - if args.power_capture: - # validate power capture environment - power_capture( args.power_capture ) - power_capture.ping() - - logging.config.fileConfig("logging.conf") - logger = logging.getLogger("annb") - - dataset = DATASETS[args.dataset]() - dataset.prepare(True) # prepare dataset, but skip potentially huge base vectors - dimension = dataset.d - point_type = 'float' - distance = dataset.distance() - if args.count == -1: - args.count = dataset.default_count() - definitions = get_definitions( - args.definitions, dimension, args.dataset, distance, args.count) - - # Filter out, from the loaded definitions, all those query argument groups - # that correspond to experiments that have already been run. (This might - # mean removing a definition altogether, so we can't just use a list - # comprehension.) 
- filtered_definitions = [] - for definition in definitions: - query_argument_groups = definition.query_argument_groups - if not query_argument_groups: - query_argument_groups = [[]] - not_yet_run = [] - for query_arguments in query_argument_groups: - if type(query_arguments) != list: - query_arguments = [query_arguments] - fn = get_result_filename(args.dataset, - args.count, definition, - query_arguments) - if args.force or not os.path.exists(fn): - not_yet_run.append(query_arguments) - if not_yet_run: - if definition.query_argument_groups: - definition = definition._replace( - query_argument_groups=not_yet_run) - filtered_definitions.append(definition) - definitions = filtered_definitions - - random.shuffle(definitions) - - if args.algorithm: - logger.info(f'running only {args.algorithm}') - definitions = [d for d in definitions if d.algorithm == args.algorithm] - - if not args.nodocker: - # See which Docker images we have available - docker_client = docker.from_env() - docker_tags = set() - for image in docker_client.images.list(): - for tag in image.tags: - tag = tag.split(':')[0] - docker_tags.add(tag) - - if args.docker_tag: - logger.info(f'running only {args.docker_tag}') - definitions = [ - d for d in definitions if d.docker_tag == args.docker_tag] - - if set(d.docker_tag for d in definitions).difference(docker_tags): - logger.info(f'not all docker images available, only: {set(docker_tags)}') - logger.info(f'missing docker images: ' - f'{str(set(d.docker_tag for d in definitions).difference(docker_tags))}') - definitions = [ - d for d in definitions if d.docker_tag in docker_tags] - - if args.max_n_algorithms >= 0: - definitions = definitions[:args.max_n_algorithms] - - if len(definitions) == 0: - raise Exception('Nothing to run') - else: - logger.info(f'Order: {definitions}') - - queue = multiprocessing.Queue() - for definition in definitions: - queue.put(definition) - #run_worker(args, queue) - workers = [multiprocessing.Process(target=run_worker, 
args=(args, queue)) - for i in range(1)] - [worker.start() for worker in workers] - [worker.join() for worker in workers] diff --git a/benchmark/plotting/__init__.py b/benchmark/plotting/__init__.py deleted file mode 100644 index a374fb97d..000000000 --- a/benchmark/plotting/__init__.py +++ /dev/null @@ -1,2 +0,0 @@ -from __future__ import absolute_import -from benchmark.plotting import * diff --git a/benchmark/plotting/eval_range_search.py b/benchmark/plotting/eval_range_search.py deleted file mode 100644 index 06b68411d..000000000 --- a/benchmark/plotting/eval_range_search.py +++ /dev/null @@ -1,220 +0,0 @@ -""" -This script contains functions to evaluate the range search results. - -Range search results are represented like a sparse CSR matrix with 3 components: - - lims, I, D - -The results for query #q are: - - I[lims[q]:lims[q + 1]] in int - -And the corresponding distances are: - - D[lims[q]:lims[q + 1]] in float - -Thus, len(lims) = nq + 1, lims[i + 1] >= lims[i] forall i -and len(D) = len(I) = lims[-1]. - -The function that computes the Average Precision measure for -a search result vs. the ground-truth is compute_AP. - -Note that the ground truth format in datasets.py is slightly different: -instead of lims it returns the number of results per query, nres. -The relationship between them is - - nres = lims[1:] - lims[:-1] - -and - - lims = np.zeros(len(nres) + 1, int) - lims[1:] = np.cumsum(nres) - -""" - -import numpy as np -from multiprocessing.pool import ThreadPool - -## code copied from Faiss contrib - -def counts_to_PR(ngt, nres, ninter, mode="overall"): - """ computes a precision-recall for a ser of queries. 
- ngt = nb of GT results per query - nres = nb of found results per query - ninter = nb of correct results per query (smaller than nres of course) - """ - - if mode == "overall": - ngt, nres, ninter = ngt.sum(), nres.sum(), ninter.sum() - - if nres > 0: - precision = ninter / nres - else: - precision = 1.0 - - if ngt > 0: - recall = ninter / ngt - elif nres == 0: - recall = 1.0 - else: - recall = 0.0 - - return precision, recall - - elif mode == "average": - # average precision and recall over queries - - mask = ngt == 0 - ngt[mask] = 1 - - recalls = ninter / ngt - recalls[mask] = (nres[mask] == 0).astype(float) - - # avoid division by 0 - mask = nres == 0 - assert np.all(ninter[mask] == 0) - ninter[mask] = 1 - nres[mask] = 1 - - precisions = ninter / nres - - return precisions.mean(), recalls.mean() - - else: - raise AssertionError() - - -def sort_range_res_2(lims, D, I): - """ sort 2 arrays using the first as key """ - I2 = np.empty_like(I) - D2 = np.empty_like(D) - nq = len(lims) - 1 - for i in range(nq): - l0, l1 = lims[i], lims[i + 1] - ii = I[l0:l1] - di = D[l0:l1] - o = di.argsort() - I2[l0:l1] = ii[o] - D2[l0:l1] = di[o] - return I2, D2 - - -def sort_range_res_1(lims, I): - I2 = np.empty_like(I) - nq = len(lims) - 1 - for i in range(nq): - l0, l1 = lims[i], lims[i + 1] - I2[l0:l1] = I[l0:l1] - I2[l0:l1].sort() - return I2 - - -def range_PR_multiple_thresholds( - lims_ref, Iref, - lims_new, Dnew, Inew, - thresholds, - mode="overall", do_sort="ref,new" - ): - """ compute precision-recall values for range search results - for several thresholds on the "new" results. 
- This is to plot PR curves - """ - # ref should be sorted by ids - if "ref" in do_sort: - Iref = sort_range_res_1(lims_ref, Iref) - - # new should be sorted by distances - if "new" in do_sort: - Inew, Dnew = sort_range_res_2(lims_new, Dnew, Inew) - - def ref_result_for(i): - return Iref[lims_ref[i]:lims_ref[i + 1]] - - def new_result_for(i): - l0, l1 = lims_new[i], lims_new[i + 1] - return Inew[l0:l1], Dnew[l0:l1] - - nq = lims_ref.size - 1 - assert lims_new.size - 1 == nq - - nt = len(thresholds) - counts = np.zeros((nq, nt, 3), dtype="int64") - - def compute_PR_for(q): - gt_ids = ref_result_for(q) - res_ids, res_dis = new_result_for(q) - - counts[q, :, 0] = len(gt_ids) - - if res_dis.size == 0: - # the rest remains at 0 - return - - # which offsets we are interested in - nres = np.searchsorted(res_dis, thresholds) - counts[q, :, 1] = nres - - if gt_ids.size == 0: - return - - # find number of TPs at each stage in the result list - ii = np.searchsorted(gt_ids, res_ids) - ii[ii == len(gt_ids)] = -1 - n_ok = np.cumsum(gt_ids[ii] == res_ids) - - # focus on threshold points - n_ok = np.hstack(([0], n_ok)) - counts[q, :, 2] = n_ok[nres] - - pool = ThreadPool(20) - pool.map(compute_PR_for, range(nq)) - # print(counts.transpose(2, 1, 0)) - - precisions = np.zeros(nt) - recalls = np.zeros(nt) - for t in range(nt): - p, r = counts_to_PR( - counts[:, t, 0], counts[:, t, 1], counts[:, t, 2], - mode=mode - ) - precisions[t] = p - recalls[t] = r - - return precisions, recalls - - - -def compute_AP(gt, res): - """ - compute range search average precision. - It works by: - 1. defining a set of thresholds - 2. compute precision, recall for the thresholds - 3. compute AUC of rhe precision-recall curve. 
- """ - gt_lims, gt_I, gt_D = gt - res_lims, res_I, res_D = res - - if len(res_D) == 0: - return 0.0 - - # start with negative distance to be sure to have the - # (p, r) = (1, 0) point - dmax = res_D.max() - thresholds = np.linspace(-0.001, res_D.max(), 100) - - precisions, recalls = range_PR_multiple_thresholds( - gt_lims, gt_I, - res_lims, res_D, res_I, thresholds) - - # compute average precision using trapezoids - accu = 0 - n = len(precisions) - for i in range(n - 1): - x0, x1 = recalls[i : i + 2] - y0, y1 = precisions[i : i + 2] - accu += (x1 - x0) * (y1 + y0) / 2 - - return accu - - diff --git a/benchmark/plotting/metrics.py b/benchmark/plotting/metrics.py deleted file mode 100644 index 043cb6381..000000000 --- a/benchmark/plotting/metrics.py +++ /dev/null @@ -1,173 +0,0 @@ -from __future__ import absolute_import -import numpy as np -import itertools -import operator -import random -import sys -import copy - -from benchmark.plotting.eval_range_search import compute_AP -from benchmark.sensors.power_capture import power_capture - -def compute_recall_without_distance_ties(true_ids, run_ids, count): - return len(set(true_ids) & set(run_ids)) - -def compute_recall_with_distance_ties(true_ids, true_dists, run_ids, count): - # This function assumes "true_dists" is monotonic either increasing or decreasing - - found_tie = False - gt_size = np.shape(true_dists)[0] - - if gt_size==count: - # nothing fancy to do in this case - recall = len(set(true_ids[:count]) & set(run_ids)) - - else: - dist_tie_check = true_dists[count-1] # tie check anchored at count-1 in GT dists - - set_end = gt_size - - for i in range(count, gt_size): - is_close = abs(dist_tie_check - true_dists[i] ) < 1e-6 - if not is_close: - set_end = i - break - - found_tie = set_end > count - - recall = len(set(true_ids[:set_end]) & set(run_ids)) - - return recall, found_tie - -def get_recall_values(true_nn, run_nn, count, count_ties=True): - true_ids, true_dists = true_nn - if not count_ties: - true_ids = 
true_ids[:, :count] - assert true_ids.shape == run_nn.shape - recalls = np.zeros(len(run_nn)) - queries_with_ties = 0 - # TODO probably not very efficient - for i in range(len(run_nn)): - if count_ties: - recalls[i], found_tie = compute_recall_with_distance_ties(true_ids[i], true_dists[i], run_nn[i], count) - if found_tie: queries_with_ties += 1 - else: - recalls[i] = compute_recall_without_distance_ties(true_ids[i], run_nn[i], count) - return (np.mean(recalls) / float(count), - np.std(recalls) / float(count), - recalls, - queries_with_ties) - -def knn(true_nn, run_nn, count, metrics): - if 'knn' not in metrics: - print('Computing knn metrics') - knn_metrics = metrics.create_group('knn') - mean, std, recalls, queries_with_ties = get_recall_values(true_nn, run_nn, count) - if queries_with_ties>0: - print("Warning: %d/%d queries contained ties accounted for in recall" % (queries_with_ties, len(run_nn))) - knn_metrics.attrs['mean'] = mean - knn_metrics.attrs['std'] = std - knn_metrics['recalls'] = recalls - else: - print("Found cached result") - return metrics['knn'] - -def ap(true_nn, run_nn, metrics): - if'ap' not in metrics: - print('Computing ap metrics') - gt_nres, gt_I, gt_D = true_nn - nq = gt_nres.shape[0] - gt_lims = np.zeros(nq + 1, dtype=int) - gt_lims[1:] = np.cumsum(gt_nres) - ap = compute_AP((gt_lims, gt_I, gt_D), run_nn) - ap_metric = metrics.create_group('ap') - ap_metric.attrs['mean'] = ap - else: - print("Found cached result") - return metrics['ap'].attrs['mean'] - -def queries_per_second(nq, attrs): - return nq / attrs["best_search_time"] - - -def index_size(attrs): - return attrs.get("index_size", 0) - - -def build_time(attrs): - return attrs.get("build_time", 1e6) - - -def dist_computations(nq, attrs): - return attrs.get("dist_comps", 0) / (attrs['run_count'] * nq) - -def watt_seconds_per_query(queries, attrs): - return power_capture.compute_watt_seconds_per_query(queries, attrs ) - -def mean_ssd_ios(attrs): - return attrs.get("mean_ssd_ios", 0) - 
-def mean_latency(attrs): - return attrs.get("mean_latency", 0) - -all_metrics = { - "k-nn": { - "description": "Recall", - "function": lambda true_nn, run_nn, metrics, run_attrs: knn(true_nn, run_nn, run_attrs["count"], metrics).attrs['mean'], # noqa - "worst": float("-inf"), - "lim": [0.0, 1.03], - }, - "ap": { - "description": "Average Precision", - "function": lambda true_nn, run_nn, metrics, run_attrs: ap(true_nn, run_nn, metrics), # noqa - "worst": float("-inf"), - "lim": [0.0, 1.03], - "search_type" : "range", - }, - "qps": { - "description": "Queries per second (1/s)", - "function": lambda true_nn, run_nn, metrics, run_attrs: queries_per_second(len(true_nn[0]), run_attrs), # noqa - "worst": float("-inf") - }, - "distcomps": { - "description": "Distance computations", - "function": lambda true_nn, run_nn, metrics, run_attrs: dist_computations(len(true_nn[0]), run_attrs), # noqa - "worst": float("inf") - }, - "build": { - "description": "Build time (s)", - "function": lambda true_nn, run_nn, metrics, run_attrs: build_time(run_attrs), # noqa - "worst": float("inf") - }, - "indexsize": { - "description": "Index size (kB)", - "function": lambda true_nn, run_nn, metrics, run_attrs: index_size(run_attrs), # noqa - "worst": float("inf") - }, - "queriessize": { - "description": "Index size (kB)/Queries per second (s)", - "function": lambda true_nn, run_nn, metrics, run_attrs: index_size(run_attrs) / queries_per_second(len(true_nn[0]), run_attrs), # noqa - "worst": float("inf") - }, - "wspq": { - "description": "Watt seconds per query (watt*s/query)", - "function": lambda true_nn, run_nn, metrics, run_attrs: watt_seconds_per_query(true_nn, run_attrs), - "worst": float("-inf") - }, - "mean_ssd_ios": { - "description": "Average SSD I/Os per query", - "function": lambda true_nn, run_nn, metrics, run_attrs: mean_ssd_ios(run_attrs), - "worst": float("inf") - }, - "mean_latency": { - "description": "Mean latency across queries", - "function": lambda true_nn, run_nn, 
metrics, run_attrs: mean_latency(run_attrs), - "worst": float("inf") - }, - "search_times": { - "description": "List of consecutive search times for the same run parameter", - "function": lambda true_nn, run_nn, metrics, run_attrs: run_attrs.get("search_times",[]), - "worst": float("inf") - }, - -} diff --git a/benchmark/plotting/plot_variants.py b/benchmark/plotting/plot_variants.py deleted file mode 100644 index 2a1743e98..000000000 --- a/benchmark/plotting/plot_variants.py +++ /dev/null @@ -1,10 +0,0 @@ -from benchmark.plotting.metrics import all_metrics as metrics - -all_plot_variants = { - "recall/time": ("k-nn", "qps"), - "recall/buildtime": ("k-nn", "build"), - "recall/indexsize": ("k-nn", "indexsize"), - "recall/distcomps": ("k-nn", "distcomps"), - "recall/candidates": ("k-nn", "candidates"), - "recall/qpssize": ("k-nn", "queriessize"), -} diff --git a/benchmark/plotting/utils.py b/benchmark/plotting/utils.py deleted file mode 100644 index bcfe8ead3..000000000 --- a/benchmark/plotting/utils.py +++ /dev/null @@ -1,194 +0,0 @@ -from __future__ import absolute_import - -import itertools -import numpy -from benchmark.plotting.metrics import all_metrics as metrics -from benchmark.sensors.power_capture import power_capture -import traceback -import sys - -def get_or_create_metrics(run): - if 'metrics' not in run: - run.create_group('metrics') - return run['metrics'] - - -def create_pointset(data, xn, yn): - xm, ym = (metrics[xn], metrics[yn]) - rev_y = -1 if ym["worst"] < 0 else 1 - rev_x = -1 if xm["worst"] < 0 else 1 - data.sort(key=lambda t: (rev_y * t[-1], rev_x * t[-2])) - - axs, ays, als = [], [], [] - # Generate Pareto frontier - xs, ys, ls = [], [], [] - last_x = xm["worst"] - comparator = ((lambda xv, lx: xv > lx) - if last_x < 0 else (lambda xv, lx: xv < lx)) - for algo, algo_name, xv, yv in data: - if not xv or not yv: - continue - axs.append(xv) - ays.append(yv) - als.append(algo_name) - if comparator(xv, last_x): - last_x = xv - xs.append(xv) - 
ys.append(yv) - ls.append(algo_name) - return xs, ys, ls, axs, ays, als - - -def compute_metrics(true_nn, res, metric_1, metric_2, - recompute=False): - all_results = {} - for i, (properties, run) in enumerate(res): - algo = properties['algo'] - algo_name = properties['name'] - # cache indices to avoid access to hdf5 file - if metric_1 == "ap" or metric_2 == "ap": - run_nn = (numpy.array(run['lims']), - numpy.array(run['neighbors']), - numpy.array(run['distances'])) - else: - run_nn = numpy.array(run['neighbors']) - if recompute and 'metrics' in run: - del run['metrics'] - metrics_cache = get_or_create_metrics(run) - - metric_1_value = metrics[metric_1]['function']( - true_nn, run_nn, metrics_cache, properties) - metric_2_value = metrics[metric_2]['function']( - true_nn, run_nn, metrics_cache, properties) - - print('%3d: %80s %12.3f %12.3f' % - (i, algo_name, metric_1_value, metric_2_value)) - - all_results.setdefault(algo, []).append( - (algo, algo_name, metric_1_value, metric_2_value)) - - return all_results - -def compute_metrics_all_runs(dataset, res, recompute=False, - sensor_metrics=False, search_times=False, - private_query=False): - - try: - if private_query: - true_nn = dataset.get_private_groundtruth() - else: - true_nn = dataset.get_groundtruth() - except: - print(f"Groundtruth for {dataset} not found.") - #traceback.print_exc() - return - - search_type = dataset.search_type() - for i, (properties, run) in enumerate(res): - algo = properties['algo'] - algo_name = properties['name'] - # cache distances to avoid access to hdf5 file - if search_type == "knn": - run_nn = numpy.array(run['neighbors']) - elif search_type == "range": - run_nn = (numpy.array(run['lims']), - numpy.array(run['neighbors']), - numpy.array(run['distances'])) - if recompute and 'metrics' in run: - print('Recomputing metrics, clearing cache') - del run['metrics'] - metrics_cache = get_or_create_metrics(run) - - dataset = properties['dataset'] - try: - dataset = dataset.decode() - algo 
= algo.decode() - algo_name = algo_name.decode() - except: - pass - - run_result = { - 'algorithm': algo, - 'parameters': algo_name, - 'dataset': dataset, - 'count': properties['count'], - } - for name, metric in metrics.items(): - if search_type == "knn" and name == "ap" or\ - search_type == "range" and name == "k-nn": - continue - if not sensor_metrics and name=="wspq": #don't process power sensor_metrics by default - continue - if not search_times and name=="search_times": #don't process search_times by default - continue - v = metric["function"](true_nn, run_nn, metrics_cache, properties) - run_result[name] = v - yield run_result - -#def compute_all_metrics(true_nn, run, properties, recompute=False): -# algo = properties["algo"] -# algo_name = properties["name"] -# print('--') -# print(algo_name) -# results = {} -# # cache nn to avoid access to hdf5 file -# run_nn = numpy.array(run["neighbors"]) -# if recompute and 'metrics' in run: -# del run['metrics'] -# metrics_cache = get_or_create_metrics(run) -# -# for name, metric in metrics.items(): -# v = metric["function"]( -# true_nn, run_nn, metrics_cache, properties) -# results[name] = v -# if v: -# print('%s: %g' % (name, v)) -# return (algo, algo_name, results) -# - -def generate_n_colors(n): - vs = numpy.linspace(0.3, 0.9, 7) - colors = [(.9, .4, .4, 1.)] - - def euclidean(a, b): - return sum((x - y)**2 for x, y in zip(a, b)) - while len(colors) < n: - new_color = max(itertools.product(vs, vs, vs), - key=lambda a: min(euclidean(a, b) for b in colors)) - colors.append(new_color + (1.,)) - return colors - - -def create_linestyles(unique_algorithms): - colors = dict( - zip(unique_algorithms, generate_n_colors(len(unique_algorithms)))) - linestyles = dict((algo, ['--', '-.', '-', ':'][i % 4]) - for i, algo in enumerate(unique_algorithms)) - markerstyles = dict((algo, ['+', '<', 'o', '*', 'x'][i % 5]) - for i, algo in enumerate(unique_algorithms)) - faded = dict((algo, (r, g, b, 0.3)) - for algo, (r, g, b, a) in 
colors.items()) - return dict((algo, (colors[algo], faded[algo], - linestyles[algo], markerstyles[algo])) - for algo in unique_algorithms) - - -def get_up_down(metric): - if metric["worst"] == float("inf"): - return "down" - return "up" - - -def get_left_right(metric): - if metric["worst"] == float("inf"): - return "left" - return "right" - - -def get_plot_label(xm, ym): - template = ("%(xlabel)s-%(ylabel)s tradeoff - %(updown)s and" - " to the %(leftright)s is better") - return template % {"xlabel": xm["description"], - "ylabel": ym["description"], - "updown": get_up_down(ym), - "leftright": get_left_right(xm)} diff --git a/benchmark/results.py b/benchmark/results.py deleted file mode 100644 index ff2ec5ee6..000000000 --- a/benchmark/results.py +++ /dev/null @@ -1,78 +0,0 @@ -from __future__ import absolute_import - -import h5py -import json -import os -import re -import traceback - - -def get_result_filename(dataset=None, count=None, definition=None, - query_arguments=None): - d = ['results'] - if dataset: - d.append(dataset) - if count: - d.append(str(count)) - if definition: - d.append(definition.algorithm) - build_args = definition.arguments - try: - for args in build_args: - if type(args) == dict and 'indexkey' in args: - build_args = [args['indexkey']] - except: - pass - data = build_args + query_arguments - data = re.sub(r'\W+', '_', json.dumps(data, sort_keys=True)).strip('_') - if len(data) > 150: - data = data[-149:] - d.append(data) - - return os.path.join(*d) - - -def store_results(dataset, count, definition, query_arguments, - attrs, results, search_type): - fn = get_result_filename( - dataset, count, definition, query_arguments) + '.hdf5' - head, tail = os.path.split(fn) - if not os.path.isdir(head): - os.makedirs(head) - f = h5py.File(fn, 'w') - for k, v in attrs.items(): - f.attrs[k] = v - if search_type == "knn": - neighbors = f.create_dataset('neighbors', (len(results), count), 'i') - for i, idxs in enumerate(results): - neighbors[i] = idxs - 
elif search_type == "range": - lims, D, I= results - f.create_dataset('neighbors', data=I) - f.create_dataset('lims', data=lims) - f.create_dataset('distances', data=D) - else: - raise NotImplementedError() - f.close() - - -def load_all_results(dataset=None, count=None): - """ - A generator for all result files. - """ - for root, _, files in os.walk(get_result_filename(dataset, count)): - for fn in files: - if os.path.splitext(fn)[-1] != '.hdf5': - continue - try: - f = h5py.File(os.path.join(root, fn), 'r+') - properties = dict(f.attrs) - yield properties, f - f.close() - except: - print('Was unable to read', fn) - traceback.print_exc() - - -def get_unique_algorithms(): - return set(properties['algo'] for properties, _ in load_all_results()) diff --git a/benchmark/runner.py b/benchmark/runner.py deleted file mode 100644 index 1218d8e88..000000000 --- a/benchmark/runner.py +++ /dev/null @@ -1,351 +0,0 @@ -import argparse -import json -import logging -import os -import threading -import time -import traceback - -import colors -import docker -import numpy -import psutil - -from benchmark.algorithms.definitions import (Definition, - instantiate_algorithm) - -from benchmark.datasets import DATASETS, upload_accelerated, download_accelerated -from benchmark.results import store_results - -from benchmark.sensors.power_capture import power_capture -from benchmark.t3.helper import t3_create_container - -def run_individual_query(algo, X, distance, count, run_count, search_type): - best_search_time = float('inf') - search_times = [] - for i in range(run_count): - print('Run %d/%d...' 
% (i + 1, run_count)) - - start = time.time() - if search_type == "knn": - algo.query(X, count) - total = (time.time() - start) - results = algo.get_results() - assert len(results) == len(X) - else: - algo.range_query(X, count) - total = (time.time() - start) - results = algo.get_range_results() - - search_time = total - best_search_time = min(best_search_time, search_time) - search_times.append( search_time ) - - attrs = { - "best_search_time": best_search_time, - "name": str(algo), - "run_count": run_count, - "distance": distance, - "type": search_type, - "count": int(count), - "search_times": search_times - } - additional = algo.get_additional() - for k in additional: - attrs[k] = additional[k] - return (attrs, results) - -def run(definition, dataset, count, run_count, rebuild, - upload_index=False, download_index=False, - blob_prefix="", sas_string="", private_query=False): - - algo = instantiate_algorithm(definition) - assert not definition.query_argument_groups \ - or hasattr(algo, "set_query_arguments"), """\ -error: query argument groups have been specified for %s.%s(%s), but the \ -algorithm instantiated from it does not implement the set_query_arguments \ -function""" % (definition.module, definition.constructor, definition.arguments) - - assert not upload_index or not download_index - - ds = DATASETS[dataset]() - #X_train = numpy.array(D['train']) - if not private_query: - X = ds.get_queries() - else: - X = ds.get_private_queries() - distance = ds.distance() - search_type = ds.search_type() - print(f"Running {definition.algorithm} on {dataset}") - print(fr"Got {len(X)} queries") - - try: - # Try loading the index from the file - memory_usage_before = algo.get_memory_usage() - if download_index: - local_dir, index_prefix, components = algo.index_files_to_store(dataset) - remote_location = blob_prefix + '/' + algo.track() + '/' + algo.__str__() + '/' + DATASETS[dataset]().short_name() + '/' - for component in components: - 
download_accelerated(remote_location + index_prefix + component, - local_dir + '/' + index_prefix + component, - False, sas_string) - print("Index files downloaded.") - if algo.load_index(dataset): - print("Index loaded.") - else: - print("Index load failed.") - elif rebuild or not algo.load_index(dataset): - # Build the index if it is not available - t0 = time.time() - algo.fit(dataset) - build_time = time.time() - t0 - print('Built index in', build_time) - else: - print("Loaded existing index") - - - index_size = algo.get_memory_usage() - memory_usage_before - print('Index memory footprint: ', index_size) - - if upload_index: - print("Starting index upload...") - local_dir, index_prefix, components = algo.index_files_to_store(dataset) - remote_location = blob_prefix + '/' + algo.track() + '/' + algo.__str__() + '/' + DATASETS[dataset]().short_name() - for component in components: - upload_accelerated(local_dir, remote_location, - index_prefix + component, sas_string) - else: - print("Starting query") - query_argument_groups = definition.query_argument_groups - # Make sure that algorithms with no query argument groups still get run - # once by providing them with a single, empty, harmless group - if not query_argument_groups: - query_argument_groups = [[]] - - for pos, query_arguments in enumerate(query_argument_groups, 1): - print("Running query argument group %d of %d..." 
% - (pos, len(query_argument_groups))) - if query_arguments: - algo.set_query_arguments(*query_arguments) - descriptor, results = run_individual_query( - algo, X, distance, count, run_count, search_type) - # A bit unclear how to set this correctly if we usually load from file - #descriptor["build_time"] = build_time - descriptor["index_size"] = index_size - descriptor["algo"] = definition.algorithm - descriptor["dataset"] = dataset - if power_capture.enabled(): - power_stats = power_capture.run(algo, X, distance, count, - run_count, search_type, descriptor) - - store_results(dataset, count, definition, - query_arguments, descriptor, results, search_type) - finally: - algo.done() - - -def run_from_cmdline(args=None): - parser = argparse.ArgumentParser(''' - - NOTICE: You probably want to run.py rather than this script. - -''') - parser.add_argument( - '--dataset', - choices=DATASETS.keys(), - help=f'Dataset to benchmark on.', - required=True) - parser.add_argument( - '--algorithm', - help='Name of algorithm for saving the results.', - required=True) - parser.add_argument( - '--module', - help='Python module containing algorithm. E.g. "ann_benchmarks.algorithms.annoy"', - required=True) - parser.add_argument( - '--constructor', - help='Constructer to load from module. E.g. "Annoy"', - required=True) - parser.add_argument( - '--count', - help='k: Number of nearest neighbours for the algorithm to return.', - required=True, - type=int) - parser.add_argument( - '--rebuild', - help='re-build index even if it exists', - action='store_true') - parser.add_argument( - '--runs', - help='Number of times to run the algorihm. Will use the fastest run-time over the bunch.', - required=True, - type=int) - parser.add_argument( - 'build', - help='JSON of arguments to pass to the constructor. E.g. ["angular", 100]' - ) - parser.add_argument( - 'queries', - help='JSON of arguments to pass to the queries. E.g. 
[100]', - nargs='*', - default=[]) - parser.add_argument( - '--power-capture', - help='Power capture parameters for the T3 competition. ' - 'Format is "ip:port:capture_time_in_seconds (ie, 127.0.0.1:3000:10).', - default="") - parser.add_argument( - '--upload-index', - help='Upload index to cloud storage.', - action='store_true') - parser.add_argument( - '--download-index', - help='Download index from cloud storage.', - action='store_true') - parser.add_argument( - '--blob-prefix', - help='Azure blob prefix to upload index to or download index from.') - parser.add_argument( - '--sas-string', - help='SAS string to authenticate to Azure blob storage.') - parser.add_argument( - '--private-query', - help='Use the new set of private queries that were not released during the competition period.', - action="store_true") - - args = parser.parse_args(args) - algo_args = json.loads(args.build) - print(algo_args) - query_args = [json.loads(q) for q in args.queries] - - if args.power_capture: - power_capture( args.power_capture ) - power_capture.ping() - - definition = Definition( - algorithm=args.algorithm, - docker_tag=None, # not needed - module=args.module, - constructor=args.constructor, - arguments=algo_args, - query_argument_groups=query_args, - disabled=False - ) - run(definition, args.dataset, args.count, args.runs, args.rebuild, - args.upload_index, args.download_index, args.blob_prefix, args.sas_string, - args.private_query) - - -def run_docker(definition, dataset, count, runs, timeout, rebuild, - cpu_limit, mem_limit=None, t3=None, power_capture=None, - upload_index=False, download_index=False, - blob_prefix="", sas_string="", private_query=False): - cmd = ['--dataset', dataset, - '--algorithm', definition.algorithm, - '--module', definition.module, - '--constructor', definition.constructor, - '--runs', str(runs), - '--count', str(count)] - if power_capture: - cmd += ["--power-capture", power_capture ] - if rebuild: - cmd.append("--rebuild") - if upload_index: - 
cmd.append("--upload-index") - cmd += ["--blob-prefix", blob_prefix] - cmd += ["--sas-string", sas_string] - if download_index: - cmd.append("--download-index") - cmd += ["--blob-prefix", blob_prefix] - cmd += ["--sas-string", sas_string] - if private_query==True: - cmd.append("--private-query") - - cmd.append(json.dumps(definition.arguments)) - cmd += [json.dumps(qag) for qag in definition.query_argument_groups] - - client = docker.from_env() - if mem_limit is None: - mem_limit = psutil.virtual_memory().available - - - container = None - if t3: - container = t3_create_container(definition, cmd, cpu_limit, mem_limit ) - timeout = 3600*24*3 # 3 days - print("Setting container wait timeout to 3 days") - - else: - container = client.containers.run( - definition.docker_tag, - cmd, - volumes={ - os.path.abspath('benchmark'): - {'bind': '/home/app/benchmark', 'mode': 'ro'}, - os.path.abspath('data'): - {'bind': '/home/app/data', 'mode': 'rw'}, - os.path.abspath('results'): - {'bind': '/home/app/results', 'mode': 'rw'}, - }, - cpuset_cpus=cpu_limit, - mem_limit=mem_limit, - detach=True) - - logger = logging.getLogger(f"annb.{container.short_id}") - - logger.info('Created container %s: CPU limit %s, mem limit %s, timeout %d, command %s' % \ - (container.short_id, cpu_limit, mem_limit, timeout, cmd)) - - def stream_logs(): - for line in container.logs(stream=True): - logger.info(colors.color(line.decode().rstrip(), fg='blue')) - - t = threading.Thread(target=stream_logs, daemon=True) - t.start() - - try: - exit_code = container.wait(timeout=timeout) - - # Exit if exit code - if exit_code not in [0, None]: - logger.error(colors.color(container.logs().decode(), fg='red')) - logger.error('Child process for container %s raised exception %d' % (container.short_id, exit_code)) - except: - logger.error('Container.wait for container %s failed with exception' % container.short_id) - logger.error('Invoked with %s' % cmd) - traceback.print_exc() - finally: - 
container.remove(force=True) - - -def run_no_docker(definition, dataset, count, runs, timeout, rebuild, - cpu_limit, mem_limit=None, t3=False, power_capture=None, - upload_index=False, download_index=False, - blob_prefix="", sas_string="", private_query=False): - cmd = ['--dataset', dataset, - '--algorithm', definition.algorithm, - '--module', definition.module, - '--constructor', definition.constructor, - '--runs', str(runs), - '--count', str(count)] - if power_capture: - cmd += ["--power-capture", power_capture ] - if rebuild: - cmd.append("--rebuild") - if upload_index: - cmd.append("--upload-index") - cmd += ["--blob-prefix", blob_prefix] - cmd += ["--sas-string", sas_string] - if download_index: - cmd.append("--download-index") - cmd += ["--blob-prefix", blob_prefix] - cmd += ["--sas-string", sas_string] - if private_query==True: - cmd.append("--private-query") - - cmd.append(json.dumps(definition.arguments)) - cmd += [json.dumps(qag) for qag in definition.query_argument_groups] - run_from_cmdline(cmd) - - diff --git a/benchmark/sensors/power_capture.py b/benchmark/sensors/power_capture.py deleted file mode 100644 index 664c39746..000000000 --- a/benchmark/sensors/power_capture.py +++ /dev/null @@ -1,248 +0,0 @@ -import requests -import uuid -import json -import time -import statistics -import math - -class power_capture: - - """ - This singleton class provides various capabilites related to the T3 track - of the Big ANN Competition for NeurIPS 2021: - * communicates with an ipmicap server ( see http://github.com/fractalsproject/ipmicap ) - * leverage's servers power sensor capture abilities - * retrieves power statistics computed by the server - """ - - ipmicap_ip = None - ipmicap_port = None - min_capture_time = None - raise_exc_on_fail = None - - @classmethod - def __init__(cls, packed_parm, raise_exc_on_fail=True): - - parms = packed_parm.split(":") - ipmicap_ip = parms[0] - ipmicap_port = int(parms[1]) - min_capture_time = float(parms[2]) - cls.ipmicap_ip 
= ipmicap_ip - cls.ipmicap_port = ipmicap_port - cls.min_capture_time = min_capture_time - cls.raise_exc_on_fail = raise_exc_on_fail - - @classmethod - def _send_msg_to_ipmicap_server(cls, uri, parms): - url = "http://%s:%d/%s" % (cls.ipmicap_ip,cls.ipmicap_port,uri) - resp = requests.get(url,parms) - if resp.status_code!=200: - msg = "T3: Failed to ping ipmicapserver." - if cls.raise_exc_on_fail: - raise Exception(msg) - else: - print("Power: Failed to ping ipmicap server.") - return False - else: - ret_json = resp.json() - return resp.json() - - @classmethod - def enabled(cls): - """ - Returns True if this singleton class has been initialized. - """ - if cls.ipmicap_ip != None: - return True - else: - return False - - @classmethod - def ping(cls): - """ - Ping the IPMICAP server and make sure it's running. - """ - return cls._send_msg_to_ipmicap_server("log",{"ping":1}) - - @classmethod - def start(cls): - """ - Start power capture at the IPMI server. - """ - session_id = str(uuid.uuid4()) - status = cls._send_msg_to_ipmicap_server("session", - {"start":1,"id":session_id}) - if status: - return session_id - else: - return False - - @classmethod - def stop(cls, session_id, all_stats=False): - """ - End power capture at the IPMI server for the session - and returm the computed power consumption. - """ - stop_parm = "all_stats" if all_stats else 1 - power_stats = cls._send_msg_to_ipmicap_server("session", - {"stop":stop_parm, "id": session_id}) - if power_stats: - return power_stats - else: - return False - - @classmethod - def get_stats(cls, session_ids): - """ - Retrieve power capture statistics for capture ids supplied. - """ - raise Exception("Not implemented.") - - @classmethod - def run_has_power_stats(cls, properties): - """ - Determines if the benchmark run has power related metrics. 
- """ - if "power_consumption" in properties: return True - else: return False - - @classmethod - def detect_power_benchmarks(cls, metrics, res): - """ - Adjust the global metrics based on the availability of - power related benchmarks in the loaded results. - """ - has_power_benchmarks = False - for i, (properties, run) in enumerate(res): - if cls.run_has_power_stats(properties): - has_power_benchmarks = True - break - if has_power_benchmarks: - return True - else: # no power benchmarks and not required, just remove from global benchmarks - #print("Ignoring the global 'wspq' metric because no power benchmarks are present.") - metrics.pop("wspq", None) - return True - - @classmethod - def detect_power_benchmarks_for_plot(cls, args, res ): - """ - If power benchmarks are requested for plot but now power benchmarks are - not present then return False. - """ - required = args.x_axis=='wspq' or args.y_axis=='wspq' - if not required: - return True - - has_power_benchmarks = False - for i, (properties, run) in enumerate(res): - if cls.run_has_power_stats(properties): - has_power_benchmarks = True - break - if has_power_benchmarks and required: return True - else: - print("No power benchmarks found in loaded results.") - return False - - - @classmethod - def compute_watt_seconds_per_query(cls, queries, attrs ): - """ - Retreive the benchmark metric wspq. 
- """ - return attrs["best_wspq"] - - @classmethod - def run(cls, algo, X, distance, count, run_count, search_type, descriptor ): - """The runner for power consumption is slightly different than the default runner.""" - - capture_time = power_capture.min_capture_time - best_search_time = descriptor["best_search_time"] - - inner_run_count = math.ceil(capture_time/best_search_time) if capture_time > best_search_time else 1 - - print('Run for power capture with %d iterations (via %d/%f) for %d iterations' - % (inner_run_count, capture_time, best_search_time, run_count ) ) - - cap_ids = [] - power_run_counts = [] - power_run_times = [] - power_consumptions = [] - power_tot_queries = [] - - best_power_cons = float('inf') - for i in range(run_count): - cap_id = cls.start() - start = time.time() - for i in range(inner_run_count): - if search_type == "knn": - algo.query(X, count) - else: - algo.range_query(X, count) - total = (time.time() - start) - power_stats = cls.stop(cap_id, all_stats=True) - power_cons = power_stats['tot_power'] - tot_queries = inner_run_count * X.shape[0] - - # Track the best one thus far - best_power_cons = min(best_power_cons, power_cons) - best_tot_queries = tot_queries # Although its always the same now, we may change that - - cap_ids.append(cap_id) - power_run_counts.append( inner_run_count ) - power_run_times.append( total ) - power_consumptions.append( power_cons ) - power_tot_queries.append( tot_queries ) - - power_cons_mean = statistics.mean( power_consumptions ) - power_cons_stdev = statistics.stdev( power_consumptions ) - best_wspq = best_power_cons/best_tot_queries - mean_wspq = power_cons_mean/best_tot_queries - print("wspq: best=%f mean=%f best_tot_queries=%d" % (best_wspq, mean_wspq, best_tot_queries)) - power_stats = {"power_cap_id": cap_ids, - "power_run_count": power_run_counts, - "power_run_time": power_run_times, - "power_consumption":power_consumptions, - "best_power_consumption": best_power_cons, - "inner_run_count": 
inner_run_count, - "power_consumption_mean": power_cons_mean, - "power_consumption_stdev": power_cons_stdev, - "best_wspq": best_wspq, - "mean_wspq": mean_wspq } - - for k in power_stats.keys(): - descriptor[k] = power_stats[k] - - -# -# To run these unit tests for the power_capture class, type 'python power_capture.py' -# -if __name__ == "__main__": - - print("power capture unit tests") - - ipmicap_ip = "192.168.99.112" # Set to your ipmicap's server ip - ipmicap_port = 3000 # Set to your ipmicap's server port - min_capture_time = -1 - - #power_capture( ipmicap_ip, ipmicap_port, min_capture_time ) - power_capture( "%s:%d:%f" % (ipmicap_ip, ipmicap_port, min_capture_time )) - - print("pinging ipmicap server at %s:%d" % (power_capture.ipmicap_ip, - power_capture.ipmicap_port)) - power_capture.ping() - - print("enabled=", power_capture.enabled()) - - print("start") - cid=power_capture.start() - print("cid=",cid) - - print("stop") - power_capture.stop() - - stats = power_capture.get_stats([cid]) - print("stats=",stats) - - print("all tests passed.") - diff --git a/benchmark/t3/__init__.py b/benchmark/t3/__init__.py deleted file mode 100644 index c3961685a..000000000 --- a/benchmark/t3/__init__.py +++ /dev/null @@ -1 +0,0 @@ -from __future__ import absolute_import diff --git a/benchmark/t3/helper.py b/benchmark/t3/helper.py deleted file mode 100644 index 2a83550fd..000000000 --- a/benchmark/t3/helper.py +++ /dev/null @@ -1,111 +0,0 @@ -import os -import docker - -from benchmark.datasets import DATASETS, BigANNDataset - -def print_cuda_versions(): - info = subprocess.check_output(['nvidia-smi', '--query-gpu=driver_version','--format=csv']) - print(info) - info = subprocess.check_output(['nvcc', '--version']) - print(info) - - -def t3_create_container( definition, cmd, cpu_limit, mem_limit): - - if definition.algorithm in [ 'faiss-t3' ]: - - print("Launching GPU container") - container = create_container_with_gpu_support( - docker.from_env(), - definition.docker_tag, - 
cmd, - volumes={ - os.path.abspath('benchmark'): - {'bind': '/home/app/benchmark', 'mode': 'ro'}, - os.path.abspath('data'): - {'bind': '/home/app/data', 'mode': 'rw'}, - os.path.abspath('results'): - {'bind': '/home/app/results', 'mode': 'rw'}, - }, - cpuset_cpus=cpu_limit, - mem_limit=mem_limit, - detach=True) - container.start() - return container - - else: - raise Exception("Docker invoke not supported for this algorithm.") - -def create_container_with_gpu_support(client, image, command, volumes, **kwargs): - - - from docker.models.images import Image - from docker.models.containers import _create_container_args - - if isinstance(image, Image): - image = image.id - - os.environ['NVIDIA_VISIBLE_DEVICES']='all' - - kwargs['image'] = image - kwargs['command'] = command - kwargs['version'] = client.containers.client.api._version - kwargs['volumes'] = volumes - create_kwargs = _create_container_args(kwargs) - - device_request = { - 'Driver': 'nvidia', - 'Capabilities': [['gpu'], ['nvidia']], - 'Count': -1, # enable all gpus - } - - if device_request is not None: - create_kwargs['host_config']['DeviceRequests'] = [device_request] - - resp = client.api.create_container(**create_kwargs) - return client.containers.get(resp['Id']) - -def create_container_with_network_host_support(client, image, command, volumes, **kwargs): - - kwargs['image'] = image - kwargs['command'] = command - kwargs['version'] = client.containers.client.api._version - kwargs['volumes'] = volumes - kwargs['network'] = "host" - create_kwargs = _create_container_args(kwargs) - - resp = client.api.create_container(**create_kwargs) - return client.containers.get(resp['Id']) - - -class BigANNDatasetAngular(BigANNDataset): - - def __init__(self, *args, **kwargs): - ret = super().__init__(*args, **kwargs) - if self.gt_fn: - print("You must compute and replace the ground truth file here:", self.gt_fn ) - else: - gt_fn = self._form_gt_fn() - if os.path.exists( os.path.join( self.basedir, gt_fn)): - 
#print("file %s already exists" % gt_fn ) - self.gt_fn = gt_fn - else: - print("You must compute the ground and create the file in here:", - os.path.join( self.basedir, gt_fn ) ) - return ret - - def _form_gt_fn(self): - gt_fn = "gt_angular.ibin" - print("ds", self.ds_fn, self.nb, 10**9) - if self.nb < 10**9: - gt_fn += ".crop_nb_%d" % ( self.nb ) - return gt_fn - - def get_groundtruth(self, *args, **kwargs): - self.gt_fn = self.gt_fn - return super().get_groundtruth(*args, **kwargs) - - def distance(self): - return "angular" - - diff --git a/cmt_logo.png b/cmt_logo.png new file mode 100644 index 000000000..4ad6a8404 Binary files /dev/null and b/cmt_logo.png differ diff --git a/create_dataset.py b/create_dataset.py deleted file mode 100644 index bc8062943..000000000 --- a/create_dataset.py +++ /dev/null @@ -1,16 +0,0 @@ -import argparse -from benchmark.datasets import DATASETS - -if __name__ == "__main__": - parser = argparse.ArgumentParser() - parser.add_argument( - '--dataset', - choices=DATASETS.keys(), - required=True) - parser.add_argument( - '--skip-data', - action='store_true', - help='skip downloading base vectors') - args = parser.parse_args() - ds = DATASETS[args.dataset]() - ds.prepare(True if args.skip_data else False) diff --git a/create_website.py b/create_website.py deleted file mode 100644 index 5c90304de..000000000 --- a/create_website.py +++ /dev/null @@ -1,278 +0,0 @@ -import matplotlib as mpl -mpl.use('Agg') # noqa -import argparse -import os -import json -import pickle -import yaml -import numpy -import hashlib -from jinja2 import Environment, FileSystemLoader - -from benchmark import results -#from benchmark.datasets import get_dataset -from benchmark.plotting.plot_variants import (all_plot_variants - as plot_variants) -from benchmark.plotting.metrics import all_metrics as metrics -from benchmark.plotting.utils import (get_plot_label, compute_metrics, - compute_metrics_all_runs, - create_pointset, - create_linestyles) -import plot - -colors = 
[ - "rgba(166,206,227,1)", - "rgba(31,120,180,1)", - "rgba(178,223,138,1)", - "rgba(51,160,44,1)", - "rgba(251,154,153,1)", - "rgba(227,26,28,1)", - "rgba(253,191,111,1)", - "rgba(255,127,0,1)", - "rgba(202,178,214,1)" -] - -point_styles = { - "o": "circle", - "<": "triangle", - "*": "star", - "x": "cross", - "+": "rect", -} - - -def convert_color(color): - r, g, b, a = color - return "rgba(%(r)d, %(g)d, %(b)d, %(a)d)" % { - "r": r * 255, "g": g * 255, "b": b * 255, "a": a} - - -def convert_linestyle(ls): - new_ls = {} - for algo in ls.keys(): - algostyle = ls[algo] - new_ls[algo] = (convert_color(algostyle[0]), - convert_color(algostyle[1]), - algostyle[2], point_styles[algostyle[3]]) - return new_ls - - -def get_run_desc(properties): - return "%(dataset)s_%(count)d_%(distance)s" % properties - - -def get_dataset_from_desc(desc): - return desc.split("_")[0] - - -def get_count_from_desc(desc): - return desc.split("_")[1] - - -def get_distance_from_desc(desc): - return desc.split("_")[2] - - -def get_dataset_label(desc): - return "{} (k = {})".format(get_dataset_from_desc(desc), - get_count_from_desc(desc)) - - -def directory_path(s): - if not os.path.isdir(s): - raise argparse.ArgumentTypeError("'%s' is not a directory" % s) - return s + "/" - - -def prepare_data(data, xn, yn): - """Change format from (algo, instance, dict) to (algo, instance, x, y).""" - res = [] - for algo, algo_name, result in data: - res.append((algo, algo_name, result[xn], result[yn])) - return res - - -parser = argparse.ArgumentParser() -parser.add_argument( - '--plottype', - help='Generate only the plots specified', - nargs='*', - choices=plot_variants.keys(), - default=plot_variants.keys()) -parser.add_argument( - '--outputdir', - help='Select output directory', - default='.', - type=directory_path, - action='store') -parser.add_argument( - '--latex', - help='generates latex code for each plot', - action='store_true') -parser.add_argument( - '--scatter', - help='create scatterplot for 
data', - action='store_true') -parser.add_argument( - '--recompute', - help='Clears the cache and recomputes the metrics', - action='store_true') -args = parser.parse_args() - - -def get_lines(all_data, xn, yn, render_all_points): - """ For each algorithm run on a dataset, obtain its performance - curve coords.""" - plot_data = [] - for algo in sorted(all_data.keys(), key=lambda x: x.lower()): - xs, ys, ls, axs, ays, als = \ - create_pointset(prepare_data(all_data[algo], xn, yn), xn, yn) - if render_all_points: - xs, ys, ls = axs, ays, als - plot_data.append({"name": algo, "coords": zip(xs, ys), "labels": ls, - "scatter": render_all_points}) - return plot_data - - -def create_plot(all_data, xn, yn, linestyle, j2_env, additional_label="", - plottype="line"): - xm, ym = (metrics[xn], metrics[yn]) - render_all_points = plottype == "bubble" - plot_data = get_lines(all_data, xn, yn, render_all_points) - latex_code = j2_env.get_template("latex.template").\ - render(plot_data=plot_data, caption=get_plot_label(xm, ym), - xlabel=xm["description"], ylabel=ym["description"]) - plot_data = get_lines(all_data, xn, yn, render_all_points) - button_label = hashlib.sha224((get_plot_label(xm, ym) + additional_label) - .encode("utf-8")).hexdigest() - return j2_env.get_template("chartjs.template").\ - render(args=args, latex_code=latex_code, button_label=button_label, - data_points=plot_data, - xlabel=xm["description"], ylabel=ym["description"], - plottype=plottype, plot_label=get_plot_label(xm, ym), - label=additional_label, linestyle=linestyle, - render_all_points=render_all_points) - - -def build_detail_site(data, label_func, j2_env, linestyles, batch=False): - for (name, runs) in data.items(): - print("Building '%s'" % name) - all_runs = runs.keys() - label = label_func(name) - data = {"normal": [], "scatter": []} - - for plottype in args.plottype: - xn, yn = plot_variants[plottype] - data["normal"].append(create_plot( - runs, xn, yn, convert_linestyle(linestyles), j2_env)) - if 
args.scatter: - data["scatter"].append( - create_plot(runs, xn, yn, convert_linestyle(linestyles), - j2_env, "Scatterplot ", "bubble")) - - # create png plot for summary page - data_for_plot = {} - for k in runs.keys(): - data_for_plot[k] = prepare_data(runs[k], 'k-nn', 'qps') - plot.create_plot( - data_for_plot, False, - 'linear', 'log', 'k-nn', 'qps', - args.outputdir + name + '.png', - linestyles, batch) - output_path = \ - args.outputdir + name + '.html' - with open(output_path, "w") as text_file: - text_file.write(j2_env.get_template("detail_page.html"). - render(title=label, plot_data=data, - args=args, batch=batch)) - - -def build_index_site(datasets, algorithms, j2_env, file_name): - dataset_data = {'batch': [], 'non-batch': []} - for mode in ['batch', 'non-batch']: - distance_measures = sorted( - set([get_distance_from_desc(e) for e in datasets[mode].keys()])) - sorted_datasets = sorted( - set([get_dataset_from_desc(e) for e in datasets[mode].keys()])) - - for dm in distance_measures: - d = {"name": dm.capitalize(), "entries": []} - for ds in sorted_datasets: - matching_datasets = [e for e in datasets[mode].keys() - if get_dataset_from_desc(e) == ds and # noqa - get_distance_from_desc(e) == dm] - sorted_matches = sorted( - matching_datasets, - key=lambda e: int(get_count_from_desc(e))) - for idd in sorted_matches: - d["entries"].append( - {"name": idd, "desc": get_dataset_label(idd)}) - dataset_data[mode].append(d) - - with open(args.outputdir + "index.html", "w") as text_file: - text_file.write(j2_env.get_template("summary.html"). - render(title="Big ANN Benchmarks", - dataset_with_distances=dataset_data, - algorithms=algorithms)) - - -def build_index_site_without_data(j2_env, file_name): - with open(args.outputdir + "index.html", "w") as text_file: - text_file.write(j2_env.get_template("summary.html"). 
- render(title="Big ANN Benchmarks")) - -# def load_all_results(): -# """Read all result files and compute all metrics""" -# all_runs_by_dataset = {'batch': {}, 'non-batch': {}} -# all_runs_by_algorithm = {'batch': {}, 'non-batch': {}} -# cached_true_dist = [] -# old_sdn = None -# for mode in ["non-batch", "batch"]: -# for properties, f in results.load_all_results(batch_mode=(mode == "batch")): -# sdn = get_run_desc(properties) -# if sdn != old_sdn: -# dataset = get_dataset(properties["dataset"]) -# cached_true_dist = list(dataset["distances"]) -# old_sdn = sdn -# algo_ds = get_dataset_label(sdn) -# desc_suffix = ("-batch" if mode == "batch" else "") -# algo = properties["algo"] + desc_suffix -# sdn += desc_suffix -# ms = compute_all_metrics( -# cached_true_dist, f, properties, args.recompute) -# all_runs_by_algorithm[mode].setdefault( -# algo, {}).setdefault(algo_ds, []).append(ms) -# all_runs_by_dataset[mode].setdefault( -# sdn, {}).setdefault(algo, []).append(ms) - -# return (all_runs_by_dataset, all_runs_by_algorithm) - - -j2_env = Environment(loader=FileSystemLoader("./templates/"), trim_blocks=True) -j2_env.globals.update(zip=zip, len=len) -#runs_by_ds, runs_by_algo = load_all_results() -# dataset_names = [get_dataset_label(x) for x in list( -# runs_by_ds['batch'].keys()) + list(runs_by_ds['non-batch'].keys())] -# algorithm_names = list(runs_by_algo['batch'].keys( -# )) + list(runs_by_algo['non-batch'].keys()) - -# linestyles = {**create_linestyles(dataset_names), -# **create_linestyles(algorithm_names)} - -# build_detail_site( -# runs_by_ds['non-batch'], -# lambda label: get_dataset_label(label), j2_env, linestyles, False) - -# build_detail_site( -# runs_by_ds['batch'], -# lambda label: get_dataset_label(label), j2_env, linestyles, True) - -# build_detail_site( -# runs_by_algo['non-batch'], -# lambda x: x, j2_env, linestyles, False) - -# build_detail_site( -# runs_by_algo['batch'], lambda x: x, j2_env, linestyles, True) - -#build_index_site(runs_by_ds, 
runs_by_algo, j2_env, "index.html") -build_index_site_without_data(j2_env, "index.html") diff --git a/data_export.py b/data_export.py deleted file mode 100644 index 83489c319..000000000 --- a/data_export.py +++ /dev/null @@ -1,95 +0,0 @@ -import pandas as pd -import sys -import os -import matplotlib as mpl -mpl.use('Agg') -import matplotlib.pyplot as plt -import argparse -import bz2 -import sys - -from benchmark.datasets import DATASETS -from benchmark.plotting.utils import compute_metrics_all_runs -from benchmark.results import load_all_results, get_unique_algorithms - -if __name__ == "__main__": - parser = argparse.ArgumentParser() - parser.add_argument( - '--output', - help='Path to the output csv file', - required=True) - parser.add_argument( - '--recompute', - action='store_true', - help='Path to the output csv file') - parser.add_argument( - - '--private-query', - help='Use the private queries and ground truth', - action='store_true') - parser.add_argument( - '--sensors', - action='store_true', - help='Export sensors data if available') - parser.add_argument( - '--search-times', - action='store_true', - help='Export search times data if available') - parser.add_argument( - '--detect-caching', - type=float, - default=None, - metavar="THRESHOLD", - help='Try to detect query response caching by analyzing search times. 
Supply a threshold betwee 0 and 1, such as 0.3.') - args = parser.parse_args() - - if args.detect_caching!=None and not args.search_times: - print("Error: --detect_caching requires the --search_times flag") - sys.exit(1) - - datasets = DATASETS.keys() - dfs = [] - - is_first = True - for dataset_name in datasets: - print("Looking at dataset", dataset_name) - dataset = DATASETS[dataset_name]() - results = load_all_results(dataset_name) - results = compute_metrics_all_runs(dataset, results, args.recompute, \ - args.sensors, args.search_times, args.private_query) - cleaned = [] - for result in results: - if 'k-nn' in result: - result['recall/ap'] = result['k-nn'] - del result['k-nn'] - if 'ap' in result: - result['recall/ap'] = result['ap'] - del result['ap'] - if args.sensors: - if 'wspq' not in result: - print('Warning: wspq sensor data not available.') - if args.search_times: - search_times = result['search_times'] - if 'search_times' in result: - # create a space separated list suitable as column for a csv - result['search_times'] = \ - " ".join( [str(el) for el in search_times ] ) - - if args.detect_caching != None: - print("%s: Checking for response caching for these search times->" % dataset_name, search_times) - percent_improvement = (search_times[0]-search_times[-1])/search_times[0] - caching = percent_improvement > args.detect_caching - result['caching'] = "%d %f %f" % ( 1 if caching else 0, args.detect_caching, percent_improvement ) - if caching: - print("Possible caching discovered: %.3f > %.3f" % ( percent_improvement, args.detect_caching) ) - else: - print("No response caching detected.") - - else: - print("Warning: 'search_times' not available.") - cleaned.append(result) - dfs.append(pd.DataFrame(cleaned)) - if len(dfs) > 0: - data = pd.concat(dfs) - data.to_csv(args.output, index=False) - diff --git a/dataset_preparation/FB_ssnpp_dataset.md b/dataset_preparation/FB_ssnpp_dataset.md deleted file mode 100644 index cac2500d1..000000000 --- 
a/dataset_preparation/FB_ssnpp_dataset.md +++ /dev/null @@ -1,83 +0,0 @@ -# The Facebook SimSearchNet++ dataset - -SimSearchNet++ features are extracted from the images. -In production, the features are used for image copy detection for integrity purposes. -There is some detail in [this blog post](https://ai.facebook.com/blog/using-ai-to-detect-covid-19-misinformation-and-exploitative-content) - -The SSN++ features are intially in 512 dimensions, L2-normalized and in floating-point. -They are compared with a given threshold (squared L2 < 0.8) and images are deemed to match and input to further processing if the distance between images are below that threshold. - -## Data preparation - -This dataset is built form public Instagram images from a variety of countries. -The SSN++ features extracted from the images have been de-duplicated. After deduplication about 1.17B vectors remain. - -99% of the dataset is used for the database vectors. - -1% of the dataset is set apart for queries, experiments and PCA training. - -### Selecting queries - -We randomly sample 3 sets of 1M vectors each from the 1%: A, B and C. - -A are the candidate query vectors. -We compute the exact range search matches of A into database B with threshold 0.8. -This yields 124210 results, with a distance histogram that looks like: - -![](fb_ssnpp_images/distance_histogram.png) - -The leftmost peak corresponds to very near image copies. -When the threshold is relaxed, more images get matches, and the 0.8 threshold is quite arbitrary. -With a 1B dataset the number of matches is expected to increase to 124k * 1000 = 124M matches. - -It is useful to look at the number of results per query vector and the number of database vectors that appear to be matching with a query vector: - -![](fb_ssnpp_images/result_stats.png) - -Both plots are in log-log scale and sorted by decreasing frequencies. 
-This way of visualizing is useful because the data distribution is very bursty: -for example, 10 query vectors get almost 100 results and fewer than 20k vectors of the 1M queries have a result at all. - -This happens often on range search with real data because (1) most images are unique (no match) and (2) there are "meme" images that are posted many times with small variations, which creates clusters of images with many matches. - -From a benchmarking point of view, memes are not interesting because they rarely appear in search results. On the other hand, vectors with no matches are relevant for applications: the ANN algorihtm should indeed be able to not retrieve anything for them. -Therefore, we do a pass to remove the candidate queries with most matches. -We arbitrarily chose a threshold of 30 matches, which reduces the number of candidate queries to 999086 and the total number of matches to 71357. - -We keep the first and second 100k of the resulting query candidates as public query set and held-out query set. - -### Compressing the dataset - -To make the dataset less bulky, the features have been reduced to 256 dimensions by PCA (trained on subset C) and encoded in uint8. -The effect of this compression is a loss of precision w.r.t. the ground-truth matches. -This means that the comparison threshold is also adjusted to a squared L2 distance. -We select the "compressed" L2 threshold as the one that maximizes the IoU of the results wrt. the float32 results. -This happens for a squared L2 threshold of **96237**. - -![](fb_ssnpp_images/IoU.png) - -The challenge ground truth is recomputed *after* compression with this threshold. 
- -## Data files - -Database: - -https://dl.fbaipublicfiles.com/billion-scale-ann-benchmarks/FB_ssnpp_database.u8bin - -100k public queries: - -https://dl.fbaipublicfiles.com/billion-scale-ann-benchmarks/FB_ssnpp_public_queries.u8bin - -Ground truth: - -https://dl.fbaipublicfiles.com/billion-scale-ann-benchmarks/FB_ssnpp_public_queries_GT.rangeres - -100k held-out queries (the XXXX is known only to the organizers): - -https://dl.fbaipublicfiles.com/billion-scale-ann-benchmarks/FB_ssnpp_heldout_queries_XXXX.u8bin - -Ground truth: TODO - -## License - -The FB SSN++ dataset is licensed under the [CC-by-NC](https://creativecommons.org/licenses/by-nc/2.0/) license. diff --git a/dataset_preparation/fb_ssnpp_images/IoU.png b/dataset_preparation/fb_ssnpp_images/IoU.png deleted file mode 100644 index 76dde5fde..000000000 Binary files a/dataset_preparation/fb_ssnpp_images/IoU.png and /dev/null differ diff --git a/dataset_preparation/fb_ssnpp_images/distance_histogram.png b/dataset_preparation/fb_ssnpp_images/distance_histogram.png deleted file mode 100644 index ecd2ebc83..000000000 Binary files a/dataset_preparation/fb_ssnpp_images/distance_histogram.png and /dev/null differ diff --git a/dataset_preparation/fb_ssnpp_images/pr_compression.png b/dataset_preparation/fb_ssnpp_images/pr_compression.png deleted file mode 100644 index 7f3c286f2..000000000 Binary files a/dataset_preparation/fb_ssnpp_images/pr_compression.png and /dev/null differ diff --git a/dataset_preparation/fb_ssnpp_images/result_stats.png b/dataset_preparation/fb_ssnpp_images/result_stats.png deleted file mode 100644 index c1a3f0096..000000000 Binary files a/dataset_preparation/fb_ssnpp_images/result_stats.png and /dev/null differ diff --git a/dataset_preparation/make_groundtruth.py b/dataset_preparation/make_groundtruth.py deleted file mode 100644 index 54eae47b7..000000000 --- a/dataset_preparation/make_groundtruth.py +++ /dev/null @@ -1,288 +0,0 @@ -import argparse -import logging -import time -import 
resource -import pdb - -import numpy as np - -import faiss - -from faiss.contrib.exhaustive_search import range_search_gpu - -import benchmark.datasets -from benchmark.datasets import DATASETS - -""" -for dataset in deep-1B bigann-1B ssnpp-1B text2image-1B msturing-1B msspacev-1B ; do - sbatch --gres=gpu:4 --ntasks=1 --time=30:00:00 --cpus-per-task=40 \ - --partition=learnlab --mem=250g --nodes=1 \ - -J GT.100M.$dataset.d -o logs/GT.100M.$dataset.d.log \ - --wrap "PYTHONPATH=. python dataset_preparation/make_groundtruth.py \ - --dataset $dataset --split 10 0 --prepare \ - --o /checkpoint/matthijs/billion-scale-ann-benchmarks/GT_100M/${dataset/1B/100M} - " -done - -""" - - -class ResultHeap: - """Accumulate query results from a sliced dataset. The final result will - be in self.D, self.I.""" - - def __init__(self, nq, k, keep_max=False): - " nq: number of query vectors, k: number of results per query " - self.I = np.zeros((nq, k), dtype='int64') - self.D = np.zeros((nq, k), dtype='float32') - self.nq, self.k = nq, k - if keep_max: - heaps = faiss.float_minheap_array_t() - else: - heaps = faiss.float_maxheap_array_t() - heaps.k = k - heaps.nh = nq - heaps.val = faiss.swig_ptr(self.D) - heaps.ids = faiss.swig_ptr(self.I) - heaps.heapify() - self.heaps = heaps - - def add_result(self, D, I): - """D, I do not need to be in a particular order (heap or sorted)""" - assert D.shape == (self.nq, self.k) - assert I.shape == (self.nq, self.k) - self.heaps.addn_with_ids( - self.k, faiss.swig_ptr(D), - faiss.swig_ptr(I), self.k) - - def finalize(self): - self.heaps.reorder() - - -def knn_ground_truth(ds, k, bs, split): - """Computes the exact KNN search results for a dataset that possibly - does not fit in RAM but for which we have an iterator that - returns it block by block. 
- """ - print("loading queries") - xq = ds.get_queries() - - if ds.distance() == "angular": - faiss.normalize_L2(xq) - - print("knn_ground_truth queries size %s k=%d" % (xq.shape, k)) - - t0 = time.time() - nq, d = xq.shape - - metric_type = ( - faiss.METRIC_L2 if ds.distance() == "euclidean" else - faiss.METRIC_INNER_PRODUCT if ds.distance() in ("ip", "angular") else - 1/0 - ) - rh = ResultHeap(nq, k, keep_max=metric_type == faiss.METRIC_INNER_PRODUCT) - - index = faiss.IndexFlat(d, metric_type) - - if faiss.get_num_gpus(): - print('running on %d GPUs' % faiss.get_num_gpus()) - index = faiss.index_cpu_to_all_gpus(index) - - # compute ground-truth by blocks, and add to heaps - i0 = 0 - for xbi in ds.get_dataset_iterator(bs=bs, split=split): - ni = xbi.shape[0] - if ds.distance() == "angular": - faiss.normalize_L2(xbi) - - index.add(xbi) - D, I = index.search(xq, k) - I += i0 - rh.add_result(D, I) - index.reset() - i0 += ni - print(f"[{time.time() - t0:.2f} s] {i0} / {ds.nb} vectors", end="\r", flush=True) - - rh.finalize() - print() - print("GT time: %.3f s (%d vectors)" % (time.time() - t0, i0)) - - return rh.D, rh.I - - -def range_ground_truth(ds, radius, bs, split): - """Computes the exact range search results for a dataset that possibly - does not fit in RAM but for which we have an iterator that - returns it block by block. 
- """ - print("loading queries") - xq = ds.get_queries() - - if ds.distance() == "angular": - faiss.normalize_L2(xq) - - print("range_ground_truth queries size %s radius=%g" % (xq.shape, radius)) - - t0 = time.time() - nq, d = xq.shape - - metric_type = ( - faiss.METRIC_L2 if ds.distance() == "euclidean" else - faiss.METRIC_INNER_PRODUCT if ds.distance() in ("ip", "angular") else - 1/0 - ) - - index = faiss.IndexFlat(d, metric_type) - - if faiss.get_num_gpus(): - print('running on %d GPUs' % faiss.get_num_gpus()) - index_gpu = faiss.index_cpu_to_all_gpus(index) - else: - index_gpu = None - - results = [] - - # compute ground-truth by blocks, and add to heaps - i0 = 0 - tot_res = 0 - for xbi in ds.get_dataset_iterator(bs=bs, split=split): - ni = xbi.shape[0] - if ds.distance() == "angular": - faiss.normalize_L2(xbi) - - index.add(xbi) - if index_gpu is None: - lims, D, I = index.range_search(xq, radius) - else: - index_gpu.add(xbi) - lims, D, I = range_search_gpu(xq, radius, index_gpu, index) - index_gpu.reset() - index.reset() - I = I.astype("int32") - I += i0 - results.append((lims, D, I)) - i0 += ni - tot_res += len(D) - print(f"[{time.time() - t0:.2f} s] {i0} / {ds.nb} vectors, {tot_res} matches", - end="\r", flush=True) - print() - print("merge into single table") - # merge all results in a single table - nres = np.zeros(nq, dtype="int32") - D = [] - I = [] - for q in range(nq): - nres_q = 0 - for lims_i, Di, Ii in results: - l0, l1 = lims_i[q], lims_i[q + 1] - if l1 > l0: - nres_q += l1 - l0 - D.append(Di[l0:l1]) - I.append(Ii[l0:l1]) - nres[q] = nres_q - - D = np.hstack(D) - I = np.hstack(I) - assert len(D) == nres.sum() == len(I) - print("GT time: %.3f s (%d vectors)" % (time.time() - t0, i0)) - return nres, D, I - -def usbin_write(ids, dist, fname): - ids = np.ascontiguousarray(ids, dtype="int32") - dist = np.ascontiguousarray(dist, dtype="float32") - assert ids.shape == dist.shape - f = open(fname, "wb") - n, d = dist.shape - np.array([n, d], 
dtype='uint32').tofile(f) - ids.tofile(f) - dist.tofile(f) - - -def range_result_write(nres, I, D, fname): - """ write the range search file format: - int32 n_queries - int32 total_res - int32[n_queries] nb_results_per_query - int32[total_res] database_ids - float32[total_res] distances - """ - nres = np.ascontiguousarray(nres, dtype="int32") - I = np.ascontiguousarray(I, dtype="int32") - D = np.ascontiguousarray(D, dtype="float32") - assert I.shape == D.shape - total_res = nres.sum() - nq = len(nres) - assert I.shape == (total_res, ) - f = open(fname, "wb") - np.array([nq, total_res], dtype='uint32').tofile(f) - nres.tofile(f) - I.tofile(f) - D.tofile(f) - - -if __name__ == "__main__": - parser = argparse.ArgumentParser() - - def aa(*args, **kwargs): - group.add_argument(*args, **kwargs) - - group = parser.add_argument_group('dataset options') - aa('--dataset', choices=DATASETS.keys(), required=True) - aa('--prepare', default=False, action="store_true", - help="call prepare() to download the dataset before computing") - aa('--basedir', help="override basedir for dataset") - aa('--split', type=int, nargs=2, default=[1, 0], - help="split that must be handled") - - group = parser.add_argument_group('computation options') - # determined from ds - # aa('--range_search', action="store_true", help="do range search instead of kNN search") - aa('--k', default=100, type=int, help="number of nearest kNN neighbors to search") - aa('--radius', default=96237, type=float, help="range search radius") - aa('--bs', default=100_000, type=int, help="batch size for database iterator") - aa("--maxRAM", default=100, type=int, help="set max RSS in GB (avoid OOM crash)") - - group = parser.add_argument_group('output options') - aa('--o', default="", help="output file name") - - args = parser.parse_args() - - print("args:", args) - - if args.basedir: - print("setting datasets basedir to", args.basedir) - benchmark.datasets.BASEDIR - benchmark.datasets.BASEDIR = args.basedir - - if 
args.maxRAM > 0: - print("setting max RSS to", args.maxRAM, "GiB") - resource.setrlimit( - resource.RLIMIT_DATA, (args.maxRAM * 1024 ** 3, resource.RLIM_INFINITY) - ) - - ds = DATASETS[args.dataset]() - - print(ds) - - if args.prepare: - print("downloading dataset...") - ds.prepare() - print("dataset ready") - - if False: # args.crop_nb != -1: - print("cropping dataset to", args.crop_nb) - ds.nb = args.crop_nb - print("new ds:", ds) - - - if ds.search_type() == "knn": - D, I = knn_ground_truth(ds, k=args.k, bs=args.bs, split=args.split) - print(f"writing index matrix of size {I.shape} to {args.o}") - # write in the usbin format - usbin_write(I, D, args.o) - elif ds.search_type() == "range": - nres, D, I = range_ground_truth(ds, radius=args.radius, bs=args.bs, split=args.split) - print(f"writing results {I.shape} to {args.o}") - range_result_write(nres, I, D, args.o) - - diff --git a/dataset_preparation/prepare_bigann.py b/dataset_preparation/prepare_bigann.py deleted file mode 100644 index 9c92a1087..000000000 --- a/dataset_preparation/prepare_bigann.py +++ /dev/null @@ -1,88 +0,0 @@ - -""" -Prepare the bigann dataset in the format expected for the 1B ANN competition - -""" - -import sys - -from faiss.contrib import datasets as faiss_datasets -import numpy as np - - -# source data is in the native Faiss format -ds = faiss_datasets.DatasetBigANN() - -stage = int(sys.argv[1]) - -outdir = "/scratch/matthijs/bigann_competiton_format/" - -def u8bin_write(x, fname): - assert x.dtype == 'uint8' - f = open(fname, "wb") - n, d = x.shape - np.array([n, d], dtype='uint32').tofile(f) - x.tofile(f) - -def ibin_write(x, fname): - assert x.dtype == 'int32' - f = open(fname, "wb") - n, d = x.shape - np.array([n, d], dtype='uint32').tofile(f) - x.tofile(f) - - -if stage == 1: # convert query format - # xq = ds.get_queries() - xq = faiss_datasets.bvecs_mmap(ds.basedir + 'bigann_query.bvecs') - xq = np.ascontiguousarray(xq) - u8bin_write(xq, outdir + "query.public.10K.u8bin") - -elif 
stage == 2: # sample new queries from train set - secretkey = int(sys.argv[2]) - rs = np.random.RandomState(secretkey) - xt = faiss_datasets.bvecs_mmap(ds.basedir + 'bigann_learn.bvecs') - print("size", xt.shape) - selection = rs.choice(len(xt), 10000, replace=False) - u8bin_write(xt[selection], outdir + f"query.private.{secretkey}.10K.u8bin") - -elif stage == 3: # convert 10M subset - - xb = faiss_datasets.bvecs_mmap(ds.basedir + 'bigann_base.bvecs') - u8bin_write(xb[:10**7], outdir + "base.10M.u8bin") - -elif stage == 4: # write the 1B vectors... - - xb = faiss_datasets.bvecs_mmap(ds.basedir + 'bigann_base.bvecs') - bs = 10**6 - f = open(outdir + "base.1B.u8bin", "wb") - np.array(xb.shape, dtype='uint32').tofile(f) - for i in range(1000): - print(i, end="\r", flush=True) - xb[i * bs : (i + 1) * bs].tofile(f) - -elif stage == 5: # convert the training vectors - - xb = faiss_datasets.bvecs_mmap(ds.basedir + 'bigann_learn.bvecs') - bs = 10**6 - f = open(outdir + "learn.100M.u8bin", "wb") - np.array(xb.shape, dtype='uint32').tofile(f) - for i in range(100): - print(i, end="\r", flush=True) - xb[i * bs : (i + 1) * bs].tofile(f) - -elif stage == 6: - # convert ground-truth files for public queries - gt = ds.get_groundtruth() - ibin_write(gt, outdir + "GT.public.1B.ibin") - - ds10M = faiss_datasets.DatasetBigANN(10) - gt = ds.get_groundtruth() - ibin_write(gt, outdir + "GT.public.10M.ibin") - - - - - - - diff --git a/dataset_preparation/prepare_fb_ssnpp.py b/dataset_preparation/prepare_fb_ssnpp.py deleted file mode 100644 index 59c5fcd06..000000000 --- a/dataset_preparation/prepare_fb_ssnpp.py +++ /dev/null @@ -1,39 +0,0 @@ - -""" -Prepare the FB SSN++ dataset in the format expected for the 1B ANN competition - -The datafiles have already been produced on the prod side: - -- FB_ssnpp_database.u8bin: the 1B database vectors, deduplicated, already - in correct format - -- 1M_queries_no_bursts_compressed.npy: a little less than 1M query vectors, - selected not to be bursty 
- -""" -import sys -import numpy as np - -secret_suffix = sys.argv[1] - -basedir = "/checkpoint/matthijs/billion-scale-ann-benchmarks/FB_ssnpp/" - -def u8bin_write(x, fname): - assert x.dtype == 'uint8' - f = open(fname, "wb") - n, d = x.shape - np.array([n, d], dtype='uint32').tofile(f) - x.tofile(f) - -xqall_fp32 = np.load(basedir + "1M_queries_no_bursts_compressed.npy") -xqall = xqall_fp32.astype('uint8') -assert np.all(xqall == xqall_fp32) -u8bin_write( - xqall[:10**5], - basedir + "FB_ssnpp_public_queries.u8bin" -) -u8bin_write( - xqall[10**5: 2 * 10**5], - basedir + "FB_ssnpp_heldout_queries_" + secret_suffix + ".u8bin" -) - diff --git a/discord-logo-white.svg b/discord-logo-white.svg new file mode 100644 index 000000000..d81da09a5 --- /dev/null +++ b/discord-logo-white.svg @@ -0,0 +1 @@ + \ No newline at end of file diff --git a/docs/index.html b/docs/index.html index ba195f130..f7b2942da 100644 --- a/docs/index.html +++ b/docs/index.html @@ -1,556 +1,556 @@ - - - - - - - - - Big ANN Benchmarks - - - - - - - - - - - - - - - -
-

Billion-Scale Approximate Nearest Neighbor Search Challenge: NeurIPS'21 competition track

- -

-
- - - - Evaluation framework on github. Subscribe to our - Medium channel - for discussions and announcements. - - - - -
-

NeurIPS'21 leaderboard and session schedule

- -

- Track T1/T2 leaderboard.
- Track T3 leaderboard. -

- - The NeurIPS session for this competition took place on Dec 8. - Find slides of the talks and videos below.
-
    -
  • 11:05-11:25: Overview Talk (slides)
  • -
  • 12:00-12:45: Overview of results presented by organizers, followed by Q&A (video)
  • -
      -
    • Standard hardware tracks T1 and T2 results (slides)
    • -
    • Custom hardware track T3 results (slides)
    • -
    -
  • 12:45-13:20: Invited talk 1 by Prof. Alexandr Andoni: Learning to Hash Robustly, with Guarantees (slides, video)
  • -
  • 13:20-13:55: Invited talk 2 by Prof. Anshumali Shrivastava:Iterative Repartitioning for Learning to Hash and the Power of k-Choices (slides,video)
  • -
  • 13:55-14:30: Talks from track winners. -
      -
    • Track 1: kst_ann_t1 Li Liu, Jin Yu, Guohao Dai, Wei Wu, Yu Qiao, Yu Wang, Lingzhi Liu, Kuaishou Technology and Tsinghua University (slides, video)
    • -
    • Track 2: BBANN Xiaomeng Yi, Xiaofan Luan, Weizhi Xu, Qianya Cheng, Jigao Luo, Xiangyu Wang, Jiquan Long, Xiao Yan, Zheng Bian, Jiarui Luo, Shengjun Li, Chengming Li, Zilliz and Southern University of Science and Technology (slides, video)
    • -
    • Track 3: OptaNNe Sourabh Dongaonkar, Mark Hildebrand, Mariano Tepper, Cecilia Aguerrebere, Ted Willke, Jawad Khan, Intel Corporation, Intel Labs and UC Davis (slides, video)
    • -
    -
  • -
  • 14:30-15:00: Open discussion on competition and future directions (github thread, video)
  • -
- Additional material:Overview Talk. -

- - - -

- Abstract for Invited talk: "Learning to Hash Robustly, with Guarantees"
- There is a gap between the high-dimensional nearest neighbor search - (NNS) algorithms achieving the best worst-case guarantees and the - top-performing ones in practice. The former are based on indexing via - the randomized Locality Sensitive Hashing (LSH), and its - derivatives. The latter "learn" the best indexing method in order to - speed-up NNS, crucially adapting to the structure of the given - dataset. Alas, the latter also almost always come at the cost of - losing the guarantees of either correctness or robust performance on - adversarial queries (or apply to datasets with an assumed extra - structure/model). - - How can we bridge these two perspectives and bring the best of both - worlds? As a step in this direction, we will talk about an NNS algorithm - that has worst-case guarantees essentially matching that of - theoretical algorithms, while optimizing the hashing to the structure - of the dataset (think instance-optimal algorithms) for performance on - the minimum-performing query. We will discuss the algorithm's ability - to optimize for a given dataset from both theoretical and practical - perspective. -

- -

- Abstract for Invited talk: "Iterative Repartitioning for Learning to Hash and the Power of k-Choices"
- Dense embedding models are commonly deployed in commercial - search engines, wherein all the vectors are pre-computed, and - near-neighbor search (NNS) is performed with the query vector to find - relevant documents. However, the bottleneck of indexing a large number - of dense vectors and performing an NNS hurts the query time and - accuracy of these models. In this talk, we argue that high-dimensional - and ultra-sparse embedding is a significantly superior alternative to - dense low-dimensional embedding for both query efficiency and - accuracy. Extreme sparsity eliminates the need for NNS by replacing - them with simple lookups, while its high dimensionality ensures that - the embeddings are informative even when sparse. However, learning - extremely high dimensional embeddings leads to blow-up in the model - size. To make the training feasible, we propose a partitioning - algorithm that learns such high-dimensional embeddings across multiple - GPUs without any communication. We theoretically prove that our way of - one-sided learning is equivalent to learning both query and label - embeddings. We call our novel system designed on sparse embeddings as - IRLI (pronounced `early'), which iteratively partitions the items by - learning the relevant buckets directly from the query-item relevance - data. Furthermore, IRLI employs a superior power-of-k-choices based - load balancing strategy. We mathematically show that IRLI retrieves - the correct item with high probability under very natural assumptions - and provides superior load balancing. IRLI surpasses the best - baseline's precision on multi-label classification while being 5x - faster on inference. For near-neighbor search tasks, the same method - outperforms the state-of-the-art Learned Hashing approach NeuralLSH by - requiring only ~ {1/6}^th of the candidates for the same recall. IRLI - is both data and model parallel, making it ideal for distributed GPU - implementation. 
We demonstrate this advantage by indexing 100 million - dense vectors and surpassing the popular FAISS library by >10%. -

-
- -
-

Why this competition?

- In the past few years, we’ve seen a lot of new research and creative approaches for large-scale ANNS, including: -
    -
  • Partition-based, and graph-based indexing strategies (as well as hybrid indexing approaches).
  • -
  • Mixing RAM and SSD storage to efficiently store and process large datasets that exceed the size of RAM.
  • -
  • Using accelerator hardware such as GPUs, FPGAs, and other custom in-memory silicon.
  • -
  • Leveraging machine learning for dimensionality reduction of the original vectors.
  • -
-

- In addition to an uptick in academic interest, many implementations of these algorithms at scale now appear in production - and high availability datacenter contexts: powering enterprise-grade, mission-critical, and web-scale search applications. - In these deployment scenarios, benchmarks such as cost, preprocessing time, power consumption become just as important as - the recall-vs-latency tradeoff. Despite this, most empirical evaluations of algorithms have focused on smaller datasets - of about a million points, e.g. ann-bechmarks.com. However, deploying recent algorithmic advances in ANNS techniques for - search, recommendation and ranking at scale requires support at billion or substantially larger scale. Barring a few recent - papers, there is limited consensus on which algorithms are effective at this scale. -

- - We believe that this challenge will be impactful in several ways: -
    -
  • Provide a comparative understanding of algorithmic ideas and their application at scale.
  • -
  • Promote the development of new techniques for the problem and demonstration of their value.
  • -
  • Provide a compilation of datasets, many new, to enable future development of algorithms.
  • -
  • Introduce a standard benchmarking approach.
  • -
- By providing a platform for those interested in this problem, we aim to encourge more collaboration and collectively advance the field at a more rapid pace. - Researchers can request Azure compute credit from a pool sponsored by Microsoft Research. -
- -
-

Tracks

-

Standard Hardware Tracks (T1 and T2)

-

- There are two standard standard hardware tracks: -

    -
  • Track 1: In-memory indices with FAISS as the baseline. - Search would use Azure Standard_F32s_v2 VMs - with 32 vCPUs and 64GB RAM. Index construction would use Azure - Standard_F64s_v2 VM - with 64vCPUs, 128GB RAM and an additional 4TB of SSD to be used for storing the data, index and other intermediate data.
  • -
  • Track 2: Out-of-core indices with DiskANN as the baseline. - In addition to the limited DRAM in T1, index can use an SSD for search. - Search would use Azure - Standard_L8s_v2 VMs with 8 vCPUS, 64GB RAM and a local SSD Index constrained to 1TB. - Construction would use Azure - Standard_F64s_v2 VM - with 64vCPU, 128GB RAM and an additional 4TB of SSD to be used for storing the data, index and other intermediate data.
  • -
- Participants are expected to release their code for index building and search which the organizers will run on separate machines. - Participants provide a configuration for their index build code that would complete in 4 days for each dataset. - The protocol for evaluation is as follows: -
    -
  • [on indexing machine] participants will be given a local path with 1B vector dataset.
  • -
  • [on indexing machine] participants build an index from the 1B vectors and store back to local disk.
  • -
  • [on indexing machine] Stored index is copied out to a temporary cloud storage location by the eval framework.
  • -
  • [on search machine] organizers load the index from cloud storage to a local path and provide the path to the search code.
  • -
  • [on search machine] organizers perform searches with held-out query set and measure recall and time to process the queries with several sets of parameters.
  • -
-

- - Finalized details for build and search hardware timing will be released along with the the eval framework. - -

Custom Hardware Track (T3)

-

- Participants can use non-standard hardware such as GPUs, AI accelerators, FPGAs, and custom in-memory silicon. - In this track, participants will either 1) send their hardware, such as PCI boards to GSI Technology or 2) evaluate - themselves using the scripts made available by the organizers. For T3 participants sending hardware, - we will make specific delivery arrangements at participant’s expense. We will install the hardware on a system under - the organizers control (we have a few bare-metal options available) and follow any installation directions provided. - Participants will be allowed to temporarily log into the machine to finalize any installation and configuration, - or for debugging installation as needed. For T3 participants running the evaluation themselves, we request remote ssh - access and sudo accounts on the systems so that the organizers can verify the system and hardware (such as IPMI support, - minimum resource availability such as disk storage for datasets). - - The evaluation phase will proceed like T1/T2, with a few modifications. -

    -
  • For participants that send their hardware, T3 organizers will provide remote access to a separate indexing machine. -
      -
    • [on separate indexing machine] participants download 1B vector dataset and store to local disk
    • -
    • [on separate indexing machine] participants build an index from the 1B vectors and store back to local disk
    • -
    • Stored index is copied to eval machine
    • -
    • [on eval machine] T3 organizers load the index from local disk
    • -
    • [on eval machine] T3 organizers provide index with held-out query set and measure recall and time to process the queries with several sets of parameters. - Index search code can use internal parallelism to batch process the queries.
    • -
    -
  • -
  • For participants that give us remote access to systems, participants are responsible for building their index. -
      -
    • [on indexing machine] participants download 1B vector dataset and store to local disk
    • -
    • [on indexing machine] participants build an index from the 1B vectors and store back to local disk
    • -
    • Stored index is copied to eval machine
    • -
    • [on eval machine] T3 organizers load the index from local disk
    • -
    • [on eval machine] T3 organizers perform searches with held-out query set and measure recall and search time with several sets of parameters.
    • -
    -
  • -
- - T3 will maintain different leaderboards for each dataset based on the following benchmarks: -
    -
  • Recall vs throughput using the same ranking formula as the T1/T2 track
  • -
  • Power- recall vs throughput/watt and a similar ranking formula to the T1/T2 track.
  • -
  • Cost measured as cost/watt (measured as queries/second/watt and MSRP/watt)
  • -
  • Total cost normalized across all tracks.
  • -
- We will provide the exact details on how we collect and compute these benchmarks as well as additional machine and operating system specification before the competition begins. -

-
- -
-

Benchmark Datasets

- We intend to use the following 6 billion point datasets. -
    -
  • BIGANN consists of SIFT descriptors applied to images from extracted from a large image dataset.
  • -
  • Facebook SimSearchNet++ is a new dataset released by Facebook for this competition. - It consists of features used for image copy detection for integrity purposes. - The features are generated by Facebook SimSearchNet++ model.
  • -
  • Microsoft Turing-ANNS-1B is a new dataset being released by the Microsoft Turing team for this competition. - It consists of Bing queries encoded by Turing AGI v5 that trains Transformers to capture similarity of intent in - web search queries. An early version of the RNN-based AGI Encoder is described in a - SIGIR'19 paper and a blogpost.
  • -
  • Microsoft SPACEV-1B is a new web search related dataset - released by Microsoft Bing for this competition. - It consists of document and query vectors encoded by Microsoft SpaceV Superior model to capture generic intent representation.
  • -
  • Yandex DEEP-1B image descriptor dataset consisting of the projected - and normalized outputs from the last fully-connected layer of the GoogLeNet model, which was pretrained on the Imagenet classification task.
  • -
  • Yandex Text-to-Image-1B is a new cross-model dataset (text and visual), - where database and query vectors have different distributions in a shared representation space. The base set consists of Image embeddings produced by the - Se-ResNext-101 model, and queries are textual embeddings produced by a variant of the DSSM model. Since the distributions are different, a 50M sample - of the query distribution is provided.
  • -
- -

- All datasets are in the common binary format that starts with 8 bytes of data consisting of num_points(uint32_t) - num_dimensions(uint32) followed by num_pts X num_dimensions x sizeof(type) bytes of data stored one vector after another. Data files - will have suffixes .fbin, .u8bin, and .i8bin to represent float32, uint8 and int8 type data. Note that a different query set - will be used for evaluation. The details of the datasets along with links to the base, query and sample sets, and the ground truth nearest neighbors - of the query set are listed below. -

- -

- The ground truth binary files for k-NN search consist of the following information: num_queries(uint32_t) - K-NN(uint32) followed by num_queries X K x sizeof(uint32_t) bytes of data representing the IDs of the K-nearest neighbors of the - queries, followed by num_queries X K x sizeof(float) bytes of data representing the distances to the corresponding points. The distances - help identify neighbors tied in terms of distances. In recall calculation, returning a neighbor not in the ground truth set but whose distance is tied - with an entry in the ground truth is counted as success. -

-

- The ground truth binary files for range search consist of the following information: num_queries(int32_t) followed by the total number - of results total_res(int32_t) followed - by num_queries X size(int32_t) bytes corresponding to num_results_per_query for each query, followed by total_res X sizeof(int32_t) - bytes corresponding to the IDs of the neighbors of each query one after the other. -

-

- The ground truth files for the first 10M slice, the first 100M slice, and the complete 1B set of each dataset against the respective query set can be downloaded - here(10M), - here(100M), and - here(1B). -

- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
Dataset Datatype Dimensions Distance Range/k-NN Base data Sample data Query data Ground truth Release terms
BIGANN uint8 128 L2 k-NN 1B points 100M base points 10K queries link CC0
Facebook SimSearchNet++* uint8 256 L2 Range (squared distance: 96237) 1B points N/A 100k queries link CC BY-NC
Microsoft Turing-ANNS* float32 100 L2 k-NN 1B points N/A 100K queries link link to terms
Microsoft SPACEV* int8 100 L2 k-NN 1B points 100M base points 29.3K queries link O-UDA
Yandex DEEP float32 96 L2 k-NN 1B points 350M base points 10K queries link CC BY 4.0
Yandex Text-to-Image* float32 200 inner-product k-NN 1B points 50M queries 100K queries link CC BY 4.0
- * new datasets
- We recommend using Axel for downloading BIGANN, Facebook-SSN++, Yandex DEEP1B and T2I datasets.
- We recommend using AzCopy for downloading Microsoft datasets. -
- -
-

Metrics

- The competition will measure recall@10 of the algorithms on the 6 data sets a private query set (unreleased) at a fixed query throughput. - Track T1 measures recall of algorithms at 10000 Queries/second (on 32 vCPUs), T2 measures recall at 1500 Queries/second, T2 measures recall at 2000 Queries/second. - The primary metric for comparison in each track will be the sum of improvements in recall over the baseline at the target QPS over all datasets. - Additionally, track T3 will also rank entries by power and cost per query. See this - notebook - for power and cost analysis. - A team has to publish an algorithm and commit to benchmarking on at least 3 datasets to be considered for ranking. Recall regression on a dataset selected - by a team will be continued as a negative score. - The recall@10(AP for SSN++-1B dataset) of the baseline algorithms on each dataset for the public query set is listed below. - - - - - - - - - - - - - - - - - -
Track Algorithm Search MachineTarget Queries/secBIGANN-1B SSN++-1B Turing-ANNS-1B SPACEV-1B DEEP-1B Text-to-Image-1B
Track 1 FAISS-CPU Azure F32s_v2 32vCPUs + 64GB RAM10000 0.634 0.753 0.703 0.728 0.650 0.069
Track 2 DiskANN Azure L8s_v2 8vCPUs + 64GB RAM + 1TB SSD 1500 0.949 0.16274 0.936 0.901 0.937 0.488
Track 3 FAISS-GPU NVIDIA V100 + 700GB RAM2000 0.927 TBA 0.910 0.850 0.942 0.86
-
- -
- Baseline DiskANN indices for T2 can be downloaded using "azcopy copy 'https://comp21storage.blob.core.windows.net/publiccontainer/comp21/diskann-T2-baseline-indices' 'local_folder' --recursive". - Note that this would take some time as the indices are large. All indices were built using R and L parameters set to 100. - Search for T2 used 16 threads and beamwidth 4. The Ls parameter was varied to tune recall vs QPS.
- Update: T2 baseline results have been modified after measuring via pybind11 interface on docker. There was a 30-40% QPS loss using this interface - as compared to direct measurements of C++ code from commandline. As a result, the QPS target has now been lowered, and the recall is reported at this threshold. - - -
-

Call for Participation and Timeline

-

- Participation is open to all teams interested in developing new algorithms or re-implementing - existing algorithms more efficiently either in software or hardware. Participants are - requested to submit a brief document through CMT - for each track they will be competing in. The document should contain the following details: -

    -
  • Name, email and affiliation of each participant in the team
  • -
  • A name and/or URL for the submission.
  • -
  • [Optional] To receive Azure credits for developing new ideas, please submit your request - by June 30th with preliminary data on smaller scale datasets and why you think - your algorithm will work well at billion scale. This will be used by the organizers to select strong - entries. We request teams who already have access to infrastructure (e.g. those from industry or - with access to large university clusters) to skip this.
  • -
- - - For Track T3, the document should contain the following additional details to help organizers plan - and assess eligibility for seperate leaderboards: -
    -
  • Type of hardware, e.g., PCIe extension board, rack-mounted system, or other.
  • -
  • Evidence of the retail MSRP of the hardware, i.e., pricing on website or copy of the customer invoice.
  • -
  • If hardware will be sent to GSI Technology (at the participants expense) or if organizers will given remote access to the systems. - For remote system access participants, whether their system supports standard IPMI power monitoring. - If not IPMI, then an equivalent power monitoring interface must be available. -
  • Operating system requirements.
  • -
  • Whether the participant requires a separate machine for index building. We have limited Azure-based - Fsv2-series machines and some bare-metal machines managed by the T3 organizers.
  • -
-

- -

Consent Forms

- Please review and complete the consent form for participation in Tracks T1/T2 - and Track T3. Note that there are separate consent forms - for the standard and custom hardware tracks. Completing the form is necessary for participation. - -

-

Timeline (subject to change)

-
    -
  • May: release of data, guidelines, and a call for participation. Registration open.
  • -
  • June: Baseline results, testing infrastructure and final ranking metrics released.
  • -
  • July 11th: Participants in need of compute resources to submit an expression of interest.
  • -
  • Mid-July: Allocation of compute resources.
  • -
  • July 30th: Final deadline for participants to submit an expression of interest through CMT.
  • -
  • October 22nd: End of competition period. Teams to release of code in a containerized form, and complete a pull request to the eval framework with code to run the algorithms.
  • -
  • October 29th: Participants submit a brief report outlining their algorithm and results.
  • -
  • Mid-November: Release of preliminary results on standardized machines. Review of code by organizers and participants. Participants can raise concerns about the evaluation.
  • -
  • Early December: Final results published, and competition results archived (the competition will go on if interest continues).
  • -
  • During NeurIPS, organizers will provide an overview of the competition and results. Organizers will also request the best entries - (including leaderboard toppers, or promising new approaches) to present an overview for further discussion.
  • -
-

-
- - -
- + + + + + + + + + Big ANN Benchmarks + + + + + + + + + + + + + + + +
+

Billion-Scale Approximate Nearest Neighbor Search Challenge: NeurIPS'21 competition track

+ +

+
+ + + + Evaluation framework on github. Subscribe to our + Medium channel + for discussions and announcements. + + + + +
+

NeurIPS'21 leaderboard and session schedule

+ +

+ Track T1/T2 leaderboard.
+ Track T3 leaderboard. +

+ + The NeurIPS session for this competition took place on Dec 8. + Find slides of the talks and videos below.
+
    +
  • 11:05-11:25: Overview Talk (slides)
  • +
  • 12:00-12:45: Overview of results presented by organizers, followed by Q&A (video)
  • +
      +
    • Standard hardware tracks T1 and T2 results (slides)
    • +
    • Custom hardware track T3 results (slides)
    • +
    +
  • 12:45-13:20: Invited talk 1 by Prof. Alexandr Andoni: Learning to Hash Robustly, with Guarantees (slides, video)
  • +
  • 13:20-13:55: Invited talk 2 by Prof. Anshumali Shrivastava: Iterative Repartitioning for Learning to Hash and the Power of k-Choices (slides, video)
  • +
  • 13:55-14:30: Talks from track winners. +
      +
    • Track 1: kst_ann_t1 Li Liu, Jin Yu, Guohao Dai, Wei Wu, Yu Qiao, Yu Wang, Lingzhi Liu, Kuaishou Technology and Tsinghua University (slides, video)
    • +
    • Track 2: BBANN Xiaomeng Yi, Xiaofan Luan, Weizhi Xu, Qianya Cheng, Jigao Luo, Xiangyu Wang, Jiquan Long, Xiao Yan, Zheng Bian, Jiarui Luo, Shengjun Li, Chengming Li, Zilliz and Southern University of Science and Technology (slides, video)
    • +
    • Track 3: OptaNNe Sourabh Dongaonkar, Mark Hildebrand, Mariano Tepper, Cecilia Aguerrebere, Ted Willke, Jawad Khan, Intel Corporation, Intel Labs and UC Davis (slides, video)
    • +
    +
  • +
  • 14:30-15:00: Open discussion on competition and future directions (github thread, video)
  • +
+ Additional material: Overview Talk. +

+ + + +

+ Abstract for Invited talk: "Learning to Hash Robustly, with Guarantees"
+ There is a gap between the high-dimensional nearest neighbor search + (NNS) algorithms achieving the best worst-case guarantees and the + top-performing ones in practice. The former are based on indexing via + the randomized Locality Sensitive Hashing (LSH), and its + derivatives. The latter "learn" the best indexing method in order to + speed up NNS, crucially adapting to the structure of the given + dataset. Alas, the latter also almost always come at the cost of + losing the guarantees of either correctness or robust performance on + adversarial queries (or apply to datasets with an assumed extra + structure/model). + + How can we bridge these two perspectives and bring the best of both + worlds? As a step in this direction, we will talk about an NNS algorithm + that has worst-case guarantees essentially matching those of + theoretical algorithms, while optimizing the hashing to the structure + of the dataset (think instance-optimal algorithms) for performance on + the minimum-performing query. We will discuss the algorithm's ability + to optimize for a given dataset from both theoretical and practical + perspectives. +

+ +

+ Abstract for Invited talk: "Iterative Repartitioning for Learning to Hash and the Power of k-Choices"
+ Dense embedding models are commonly deployed in commercial + search engines, wherein all the vectors are pre-computed, and + near-neighbor search (NNS) is performed with the query vector to find + relevant documents. However, the bottleneck of indexing a large number + of dense vectors and performing an NNS hurts the query time and + accuracy of these models. In this talk, we argue that high-dimensional + and ultra-sparse embedding is a significantly superior alternative to + dense low-dimensional embedding for both query efficiency and + accuracy. Extreme sparsity eliminates the need for NNS by replacing + them with simple lookups, while its high dimensionality ensures that + the embeddings are informative even when sparse. However, learning + extremely high dimensional embeddings leads to a blow-up in the model + size. To make the training feasible, we propose a partitioning + algorithm that learns such high-dimensional embeddings across multiple + GPUs without any communication. We theoretically prove that our way of + one-sided learning is equivalent to learning both query and label + embeddings. We call our novel system, designed on sparse embeddings, + IRLI (pronounced 'early'), which iteratively partitions the items by + learning the relevant buckets directly from the query-item relevance + data. Furthermore, IRLI employs a superior power-of-k-choices based + load balancing strategy. We mathematically show that IRLI retrieves + the correct item with high probability under very natural assumptions + and provides superior load balancing. IRLI surpasses the best + baseline's precision on multi-label classification while being 5x + faster on inference. For near-neighbor search tasks, the same method + outperforms the state-of-the-art Learned Hashing approach NeuralLSH by + requiring only about one-sixth of the candidates for the same recall. IRLI + is both data and model parallel, making it ideal for distributed GPU + implementation. 
We demonstrate this advantage by indexing 100 million + dense vectors and surpassing the popular FAISS library by >10%. +

+
+ +
+

Why this competition?

+ In the past few years, we’ve seen a lot of new research and creative approaches for large-scale ANNS, including: +
    +
  • Partition-based, and graph-based indexing strategies (as well as hybrid indexing approaches).
  • +
  • Mixing RAM and SSD storage to efficiently store and process large datasets that exceed the size of RAM.
  • +
  • Using accelerator hardware such as GPUs, FPGAs, and other custom in-memory silicon.
  • +
  • Leveraging machine learning for dimensionality reduction of the original vectors.
  • +
+

+ In addition to an uptick in academic interest, many implementations of these algorithms at scale now appear in production + and high availability datacenter contexts: powering enterprise-grade, mission-critical, and web-scale search applications. + In these deployment scenarios, benchmarks such as cost, preprocessing time, and power consumption become just as important as + the recall-vs-latency tradeoff. Despite this, most empirical evaluations of algorithms have focused on smaller datasets + of about a million points, e.g. ann-benchmarks.com. However, deploying recent algorithmic advances in ANNS techniques for + search, recommendation and ranking at scale requires support at billion or substantially larger scale. Barring a few recent + papers, there is limited consensus on which algorithms are effective at this scale. +

+ + We believe that this challenge will be impactful in several ways: +
    +
  • Provide a comparative understanding of algorithmic ideas and their application at scale.
  • +
  • Promote the development of new techniques for the problem and demonstration of their value.
  • +
  • Provide a compilation of datasets, many new, to enable future development of algorithms.
  • +
  • Introduce a standard benchmarking approach.
  • +
+ By providing a platform for those interested in this problem, we aim to encourage more collaboration and collectively advance the field at a more rapid pace. + Researchers can request Azure compute credit from a pool sponsored by Microsoft Research. +
+ +
+

Tracks

+

Standard Hardware Tracks (T1 and T2)

+

+ There are two standard hardware tracks: +

    +
  • Track 1: In-memory indices with FAISS as the baseline. + Search would use Azure Standard_F32s_v2 VMs + with 32 vCPUs and 64GB RAM. Index construction would use Azure + Standard_F64s_v2 VM + with 64vCPUs, 128GB RAM and an additional 4TB of SSD to be used for storing the data, index and other intermediate data.
  • +
  • Track 2: Out-of-core indices with DiskANN as the baseline. + In addition to the limited DRAM in T1, index can use an SSD for search. + Search would use Azure + Standard_L8s_v2 VMs with 8 vCPUS, 64GB RAM and a local SSD Index constrained to 1TB. + Construction would use Azure + Standard_F64s_v2 VM + with 64vCPU, 128GB RAM and an additional 4TB of SSD to be used for storing the data, index and other intermediate data.
  • +
+ Participants are expected to release their code for index building and search which the organizers will run on separate machines. + Participants provide a configuration for their index build code that would complete in 4 days for each dataset. + The protocol for evaluation is as follows: +
    +
  • [on indexing machine] participants will be given a local path with 1B vector dataset.
  • +
  • [on indexing machine] participants build an index from the 1B vectors and store back to local disk.
  • +
  • [on indexing machine] Stored index is copied out to a temporary cloud storage location by the eval framework.
  • +
  • [on search machine] organizers load the index from cloud storage to a local path and provide the path to the search code.
  • +
  • [on search machine] organizers perform searches with held-out query set and measure recall and time to process the queries with several sets of parameters.
  • +
+

+ + Finalized details for build and search hardware timing will be released along with the eval framework. + +

Custom Hardware Track (T3)

+

+ Participants can use non-standard hardware such as GPUs, AI accelerators, FPGAs, and custom in-memory silicon. + In this track, participants will either 1) send their hardware, such as PCI boards to GSI Technology or 2) evaluate + themselves using the scripts made available by the organizers. For T3 participants sending hardware, + we will make specific delivery arrangements at participant’s expense. We will install the hardware on a system under + the organizers control (we have a few bare-metal options available) and follow any installation directions provided. + Participants will be allowed to temporarily log into the machine to finalize any installation and configuration, + or for debugging installation as needed. For T3 participants running the evaluation themselves, we request remote ssh + access and sudo accounts on the systems so that the organizers can verify the system and hardware (such as IPMI support, + minimum resource availability such as disk storage for datasets). + + The evaluation phase will proceed like T1/T2, with a few modifications. +

    +
  • For participants that send their hardware, T3 organizers will provide remote access to a separate indexing machine. +
      +
    • [on separate indexing machine] participants download 1B vector dataset and store to local disk
    • +
    • [on separate indexing machine] participants build an index from the 1B vectors and store back to local disk
    • +
    • Stored index is copied to eval machine
    • +
    • [on eval machine] T3 organizers load the index from local disk
    • +
    • [on eval machine] T3 organizers provide index with held-out query set and measure recall and time to process the queries with several sets of parameters. + Index search code can use internal parallelism to batch process the queries.
    • +
    +
  • +
  • For participants that give us remote access to systems, participants are responsible for building their index. +
      +
    • [on indexing machine] participants download 1B vector dataset and store to local disk
    • +
    • [on indexing machine] participants build an index from the 1B vectors and store back to local disk
    • +
    • Stored index is copied to eval machine
    • +
    • [on eval machine] T3 organizers load the index from local disk
    • +
    • [on eval machine] T3 organizers perform searches with held-out query set and measure recall and search time with several sets of parameters.
    • +
    +
  • +
+ + T3 will maintain different leaderboards for each dataset based on the following benchmarks: +
    +
  • Recall vs throughput using the same ranking formula as the T1/T2 track
  • +
  • Power- recall vs throughput/watt and a similar ranking formula to the T1/T2 track.
  • +
  • Cost measured as cost/watt (measured as queries/second/watt and MSRP/watt)
  • +
  • Total cost normalized across all tracks.
  • +
+ We will provide the exact details on how we collect and compute these benchmarks as well as additional machine and operating system specification before the competition begins. +

+
+ +
+

Benchmark Datasets

+ We intend to use the following 6 billion point datasets. +
    +
  • BIGANN consists of SIFT descriptors extracted from images in a large image dataset.
  • +
  • Facebook SimSearchNet++ is a new dataset released by Facebook for this competition. + It consists of features used for image copy detection for integrity purposes. + The features are generated by Facebook SimSearchNet++ model.
  • +
  • Microsoft Turing-ANNS-1B is a new dataset being released by the Microsoft Turing team for this competition. + It consists of Bing queries encoded by Turing AGI v5 that trains Transformers to capture similarity of intent in + web search queries. An early version of the RNN-based AGI Encoder is described in a + SIGIR'19 paper and a blogpost.
  • +
  • Microsoft SPACEV-1B is a new web search related dataset + released by Microsoft Bing for this competition. + It consists of document and query vectors encoded by Microsoft SpaceV Superior model to capture generic intent representation.
  • +
  • Yandex DEEP-1B image descriptor dataset consisting of the projected + and normalized outputs from the last fully-connected layer of the GoogLeNet model, which was pretrained on the Imagenet classification task.
  • +
  • Yandex Text-to-Image-1B is a new cross-modal dataset (text and visual), + where database and query vectors have different distributions in a shared representation space. The base set consists of Image embeddings produced by the + Se-ResNext-101 model, and queries are textual embeddings produced by a variant of the DSSM model. Since the distributions are different, a 50M sample + of the query distribution is provided.
  • +
+ +

+ All datasets are in the common binary format that starts with 8 bytes of data consisting of num_points(uint32_t) + num_dimensions(uint32) followed by num_pts X num_dimensions x sizeof(type) bytes of data stored one vector after another. Data files + will have suffixes .fbin, .u8bin, and .i8bin to represent float32, uint8 and int8 type data. Note that a different query set + will be used for evaluation. The details of the datasets along with links to the base, query and sample sets, and the ground truth nearest neighbors + of the query set are listed below. +

+ +

+ The ground truth binary files for k-NN search consist of the following information: num_queries(uint32_t) + K-NN(uint32) followed by num_queries X K x sizeof(uint32_t) bytes of data representing the IDs of the K-nearest neighbors of the + queries, followed by num_queries X K x sizeof(float) bytes of data representing the distances to the corresponding points. The distances + help identify neighbors tied in terms of distances. In recall calculation, returning a neighbor not in the ground truth set but whose distance is tied + with an entry in the ground truth is counted as success. +

+

+ The ground truth binary files for range search consist of the following information: num_queries(int32_t) followed by the total number + of results total_res(int32_t) followed + by num_queries X size(int32_t) bytes corresponding to num_results_per_query for each query, followed by total_res X sizeof(int32_t) + bytes corresponding to the IDs of the neighbors of each query one after the other. +

+

+ The ground truth files for the first 10M slice, the first 100M slice, and the complete 1B set of each dataset against the respective query set can be downloaded + here(10M), + here(100M), and + here(1B). +

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
Dataset Datatype Dimensions Distance Range/k-NN Base data Sample data Query data Ground truth Release terms
BIGANN uint8 128 L2 k-NN 1B points 100M base points 10K queries link CC0
Facebook SimSearchNet++* uint8 256 L2 Range (squared distance: 96237) 1B points N/A 100k queries link CC BY-NC
Microsoft Turing-ANNS* float32 100 L2 k-NN 1B points N/A 100K queries link link to terms
Microsoft SPACEV* int8 100 L2 k-NN 1B points 100M base points 29.3K queries link O-UDA
Yandex DEEP float32 96 L2 k-NN 1B points 350M base points 10K queries link CC BY 4.0
Yandex Text-to-Image* float32 200 inner-product k-NN 1B points 50M queries 100K queries link CC BY 4.0
+ * new datasets
+ We recommend using Axel for downloading BIGANN, Facebook-SSN++, Yandex DEEP1B and T2I datasets.
+ We recommend using AzCopy for downloading Microsoft datasets. +
+ +
+

Metrics

+ The competition will measure recall@10 of the algorithms on the 6 datasets using a private query set (unreleased) at a fixed query throughput. + Track T1 measures recall of algorithms at 10000 Queries/second (on 32 vCPUs), T2 measures recall at 1500 Queries/second, T3 measures recall at 2000 Queries/second. + The primary metric for comparison in each track will be the sum of improvements in recall over the baseline at the target QPS over all datasets. + Additionally, track T3 will also rank entries by power and cost per query. See this + notebook + for power and cost analysis. + A team has to publish an algorithm and commit to benchmarking on at least 3 datasets to be considered for ranking. Recall regression on a dataset selected + by a team will be counted as a negative score. + The recall@10 (AP for SSN++-1B dataset) of the baseline algorithms on each dataset for the public query set is listed below. + + + + + + + + + + + + + + + + + +
Track Algorithm Search MachineTarget Queries/secBIGANN-1B SSN++-1B Turing-ANNS-1B SPACEV-1B DEEP-1B Text-to-Image-1B
Track 1 FAISS-CPU Azure F32s_v2 32vCPUs + 64GB RAM10000 0.634 0.753 0.703 0.728 0.650 0.069
Track 2 DiskANN Azure L8s_v2 8vCPUs + 64GB RAM + 1TB SSD 1500 0.949 0.16274 0.936 0.901 0.937 0.488
Track 3 FAISS-GPU NVIDIA V100 + 700GB RAM2000 0.927 TBA 0.910 0.850 0.942 0.86
+
+ +
+ Baseline DiskANN indices for T2 can be downloaded using "azcopy copy 'https://comp21storage.blob.core.windows.net/publiccontainer/comp21/diskann-T2-baseline-indices' 'local_folder' --recursive". + Note that this would take some time as the indices are large. All indices were built using R and L parameters set to 100. + Search for T2 used 16 threads and beamwidth 4. The Ls parameter was varied to tune recall vs QPS.
+ Update: T2 baseline results have been modified after measuring via pybind11 interface on docker. There was a 30-40% QPS loss using this interface + as compared to direct measurements of C++ code from commandline. As a result, the QPS target has now been lowered, and the recall is reported at this threshold. + + +
+

Call for Participation and Timeline

+

+ Participation is open to all teams interested in developing new algorithms or re-implementing + existing algorithms more efficiently either in software or hardware. Participants are + requested to submit a brief document through CMT + for each track they will be competing in. The document should contain the following details: +

    +
  • Name, email and affiliation of each participant in the team
  • +
  • A name and/or URL for the submission.
  • +
  • [Optional] To receive Azure credits for developing new ideas, please submit your request + by June 30th with preliminary data on smaller scale datasets and why you think + your algorithm will work well at billion scale. This will be used by the organizers to select strong + entries. We request teams who already have access to infrastructure (e.g. those from industry or + with access to large university clusters) to skip this.
  • +
+ + + For Track T3, the document should contain the following additional details to help organizers plan + and assess eligibility for separate leaderboards: +
    +
  • Type of hardware, e.g., PCIe extension board, rack-mounted system, or other.
  • +
  • Evidence of the retail MSRP of the hardware, i.e., pricing on website or copy of the customer invoice.
  • +
  • If hardware will be sent to GSI Technology (at the participant's expense) or if organizers will be given remote access to the systems. + For remote system access participants, whether their system supports standard IPMI power monitoring. + If not IPMI, then an equivalent power monitoring interface must be available. +
  • Operating system requirements.
  • +
  • Whether the participant requires a separate machine for index building. We have limited Azure-based + Fsv2-series machines and some bare-metal machines managed by the T3 organizers.
  • +
+

+ +

Consent Forms

+ Please review and complete the consent form for participation in Tracks T1/T2 + and Track T3. Note that there are separate consent forms + for the standard and custom hardware tracks. Completing the form is necessary for participation. + +

+

Timeline (subject to change)

+
    +
  • May: release of data, guidelines, and a call for participation. Registration open.
  • +
  • June: Baseline results, testing infrastructure and final ranking metrics released.
  • +
  • July 11th: Participants in need of compute resources to submit an expression of interest.
  • +
  • Mid-July: Allocation of compute resources.
  • +
  • July 30th: Final deadline for participants to submit an expression of interest through CMT.
  • +
  • October 22nd: End of competition period. Teams to release code in a containerized form, and complete a pull request to the eval framework with code to run the algorithms.
  • +
  • October 29th: Participants submit a brief report outlining their algorithm and results.
  • +
  • Mid-November: Release of preliminary results on standardized machines. Review of code by organizers and participants. Participants can raise concerns about the evaluation.
  • +
  • Early December: Final results published, and competition results archived (the competition will go on if interest continues).
  • +
  • During NeurIPS, organizers will provide an overview of the competition and results. Organizers will also request the best entries + (including leaderboard toppers, or promising new approaches) to present an overview for further discussion.
  • +
+

+
+ + +
+ \ No newline at end of file diff --git a/eval/show_operating_points.py b/eval/show_operating_points.py deleted file mode 100644 index b1c224d57..000000000 --- a/eval/show_operating_points.py +++ /dev/null @@ -1,26 +0,0 @@ -import argparse -import pandas as pd - -if __name__ == "__main__": - parser = argparse.ArgumentParser() - parser.add_argument( - '--algorithm', - required=True) - parser.add_argument( - '--threshold', - default=10000, - help='minimum QPS (10,000 T1/2,000 T2)', - type=int) - parser.add_argument( - 'csv', - metavar='CSV', - help='input csv') - - args = parser.parse_args() - df = pd.read_csv(args.csv) - - print(df[(df.qps > args.threshold) & (df.algorithm == args.algorithm)].groupby(['algorithm', 'dataset']).max()[['recall/ap']]) - - - - diff --git a/fonts/MediumLLWeb-Regular.woff2 b/fonts/MediumLLWeb-Regular.woff2 new file mode 100644 index 000000000..8531f544f Binary files /dev/null and b/fonts/MediumLLWeb-Regular.woff2 differ diff --git a/fonts/MediumLLWeb-SemiBold.woff2 b/fonts/MediumLLWeb-SemiBold.woff2 new file mode 100644 index 000000000..fe88205ce Binary files /dev/null and b/fonts/MediumLLWeb-SemiBold.woff2 differ diff --git a/index.html b/index.html index aeea3c4de..56b5f9261 100644 --- a/index.html +++ b/index.html @@ -1,551 +1,9 @@ - - - - - - - - Big ANN Benchmarks - - - - - - - - - - - - - - - -
-

Billion-Scale Approximate Nearest Neighbor Search Challenge: NeurIPS'21 competition track

- -

- - - - -

Code, Report, Results and Blogs

- - -
-

NeurIPS'21 session schedule

- The NeurIPS session for this competition is scheduled for Dec 8. - NeurIPS registration is required for access to the session.
- Overview Talk and Break-out session schedule (GMT). -
    -
  • 11:05-11:25: Overview Talk (slides)
  • -
  • 12:00-12:45: Overview of results presented by organizers, followed by Q&A
  • -
      -
    • Standard hardware tracks T1 and T2 results (slides)
    • -
    • Custom hardware track T3 results (slides)
    • -
    -
  • 12:45-13:20: Invited talk 1 by Prof. Alexandr Andoni: Learning to Hash Robustly, with Guarantees (slides)
  • -
  • 13:20-13:55: Invited talk 2 by Prof. Anshumali Shrivastava:Iterative Repartitioning for Learning to Hash and the Power of k-Choices (slides)
  • -
  • 13:55-14:30: Talks from track winners. -
      -
    • Track 1: kst_ann_t1 Li Liu, Jin Yu, Guohao Dai, Wei Wu, Yu Qiao, Yu Wang, Lingzhi Liu, Kuaishou Technology and Tsinghua University
    • -
    • Track 2: BBANN Xiaomeng Yi, Xiaofan Luan, Weizhi Xu, Qianya Cheng, Jigao Luo, Xiangyu Wang, Jiquan Long, Xiao Yan, Zheng Bian, Jiarui Luo, Shengjun Li, Chengming Li, Zilliz and Southern University of Science and Technology (slides)
    • -
    • Track 3: OptaNNe Sourabh Dongaonkar, Mark Hildebrand, Mariano Tepper, Cecilia Aguerrebere, Ted Willke, Jawad Khan, Intel Corporation, Intel Labs and UC Davis (slides)
    • -
    -
  • -
  • 14:30-15:00: Open discussion on competition and future directions (github thread)
  • -
-

- - - -

- Abstract for Invited talk: "Learning to Hash Robustly, with Guarantees"
- There is a gap between the high-dimensional nearest neighbor search - (NNS) algorithms achieving the best worst-case guarantees and the - top-performing ones in practice. The former are based on indexing via - the randomized Locality Sensitive Hashing (LSH), and its - derivatives. The latter "learn" the best indexing method in order to - speed-up NNS, crucially adapting to the structure of the given - dataset. Alas, the latter also almost always come at the cost of - losing the guarantees of either correctness or robust performance on - adversarial queries (or apply to datasets with an assumed extra - structure/model). - - How can we bridge these two perspectives and bring the best of both - worlds? As a step in this direction, we will talk about an NNS algorithm - that has worst-case guarantees essentially matching that of - theoretical algorithms, while optimizing the hashing to the structure - of the dataset (think instance-optimal algorithms) for performance on - the minimum-performing query. We will discuss the algorithm's ability - to optimize for a given dataset from both theoretical and practical - perspective. -

- -

- Abstract for Invited talk: "Iterative Repartitioning for Learning to Hash and the Power of k-Choices"
- Dense embedding models are commonly deployed in commercial - search engines, wherein all the vectors are pre-computed, and - near-neighbor search (NNS) is performed with the query vector to find - relevant documents. However, the bottleneck of indexing a large number - of dense vectors and performing an NNS hurts the query time and - accuracy of these models. In this talk, we argue that high-dimensional - and ultra-sparse embedding is a significantly superior alternative to - dense low-dimensional embedding for both query efficiency and - accuracy. Extreme sparsity eliminates the need for NNS by replacing - them with simple lookups, while its high dimensionality ensures that - the embeddings are informative even when sparse. However, learning - extremely high dimensional embeddings leads to blow-up in the model - size. To make the training feasible, we propose a partitioning - algorithm that learns such high-dimensional embeddings across multiple - GPUs without any communication. We theoretically prove that our way of - one-sided learning is equivalent to learning both query and label - embeddings. We call our novel system designed on sparse embeddings as - IRLI (pronounced `early'), which iteratively partitions the items by - learning the relevant buckets directly from the query-item relevance - data. Furthermore, IRLI employs a superior power-of-k-choices based - load balancing strategy. We mathematically show that IRLI retrieves - the correct item with high probability under very natural assumptions - and provides superior load balancing. IRLI surpasses the best - baseline's precision on multi-label classification while being 5x - faster on inference. For near-neighbor search tasks, the same method - outperforms the state-of-the-art Learned Hashing approach NeuralLSH by - requiring only ~ {1/6}^th of the candidates for the same recall. IRLI - is both data and model parallel, making it ideal for distributed GPU - implementation. 
We demonstrate this advantage by indexing 100 million - dense vectors and surpassing the popular FAISS library by >10%. -

-
- -
-

Why this competition?

- In the past few years, we’ve seen a lot of new research and creative approaches for large-scale ANNS, including: -
    -
  • Partition-based, and graph-based indexing strategies (as well as hybrid indexing approaches).
  • -
  • Mixing RAM and SSD storage to efficiently store and process large datasets that exceed the size of RAM.
  • -
  • Using accelerator hardware such as GPUs, FPGAs, and other custom in-memory silicon.
  • -
  • Leveraging machine learning for dimensionality reduction of the original vectors.
  • -
-

- In addition to an uptick in academic interest, many implementations of these algorithms at scale now appear in production - and high availability datacenter contexts: powering enterprise-grade, mission-critical, and web-scale search applications. - In these deployment scenarios, benchmarks such as cost, preprocessing time, power consumption become just as important as - the recall-vs-latency tradeoff. Despite this, most empirical evaluations of algorithms have focused on smaller datasets - of about a million points, e.g. ann-bechmarks.com. However, deploying recent algorithmic advances in ANNS techniques for - search, recommendation and ranking at scale requires support at billion or substantially larger scale. Barring a few recent - papers, there is limited consensus on which algorithms are effective at this scale. -

- - We believe that this challenge will be impactful in several ways: -
    -
  • Provide a comparative understanding of algorithmic ideas and their application at scale.
  • -
  • Promote the development of new techniques for the problem and demonstration of their value.
  • -
  • Provide a compilation of datasets, many new, to enable future development of algorithms.
  • -
  • Introduce a standard benchmarking approach.
  • -
- By providing a platform for those interested in this problem, we aim to encourge more collaboration and collectively advance the field at a more rapid pace. - Researchers can request Azure compute credit from a pool sponsored by Microsoft Research. -
- -
-

Tracks

-

Standard Hardware Tracks (T1 and T2)

-

- There are two standard standard hardware tracks: -

    -
  • Track 1: In-memory indices with FAISS as the baseline. - Search would use Azure Standard_F32s_v2 VMs - with 32 vCPUs and 64GB RAM. Index construction would use Azure - Standard_F64s_v2 VM - with 64vCPUs, 128GB RAM and an additional 4TB of SSD to be used for storing the data, index and other intermediate data.
  • -
  • Track 2: Out-of-core indices with DiskANN as the baseline. - In addition to the limited DRAM in T1, index can use an SSD for search. - Search would use Azure - Standard_L8s_v2 VMs with 8 vCPUS, 64GB RAM and a local SSD Index constrained to 1TB. - Construction would use Azure - Standard_F64s_v2 VM - with 64vCPU, 128GB RAM and an additional 4TB of SSD to be used for storing the data, index and other intermediate data.
  • -
- Participants are expected to release their code for index building and search which the organizers will run on separate machines. - Participants provide a configuration for their index build code that would complete in 4 days for each dataset. - The protocol for evaluation is as follows: -
    -
  • [on indexing machine] participants will be given a local path with 1B vector dataset.
  • -
  • [on indexing machine] participants build an index from the 1B vectors and store back to local disk.
  • -
  • [on indexing machine] Stored index is copied out to a temporary cloud storage location by the eval framework.
  • -
  • [on search machine] organizers load the index from cloud storage to a local path and provide the path to the search code.
  • -
  • [on search machine] organizers perform searches with held-out query set and measure recall and time to process the queries with several sets of parameters.
  • -
-

- - Finalized details for build and search hardware timing will be released along with the the eval framework. - -

Custom Hardware Track (T3)

-

- Participants can use non-standard hardware such as GPUs, AI accelerators, FPGAs, and custom in-memory silicon. - In this track, participants will either 1) send their hardware, such as PCI boards to GSI Technology or 2) evaluate - themselves using the scripts made available by the organizers. For T3 participants sending hardware, - we will make specific delivery arrangements at participant’s expense. We will install the hardware on a system under - the organizers control (we have a few bare-metal options available) and follow any installation directions provided. - Participants will be allowed to temporarily log into the machine to finalize any installation and configuration, - or for debugging installation as needed. For T3 participants running the evaluation themselves, we request remote ssh - access and sudo accounts on the systems so that the organizers can verify the system and hardware (such as IPMI support, - minimum resource availability such as disk storage for datasets). - - The evaluation phase will proceed like T1/T2, with a few modifications. -

    -
  • For participants that send their hardware, T3 organizers will provide remote access to a separate indexing machine. -
      -
    • [on separate indexing machine] participants download 1B vector dataset and store to local disk
    • -
    • [on separate indexing machine] participants build an index from the 1B vectors and store back to local disk
    • -
    • Stored index is copied to eval machine
    • -
    • [on eval machine] T3 organizers load the index from local disk
    • -
    • [on eval machine] T3 organizers provide index with held-out query set and measure recall and time to process the queries with several sets of parameters. - Index search code can use internal parallelism to batch process the queries.
    • -
    -
  • -
  • For participants that give us remote access to systems, participants are responsible for building their index. -
      -
    • [on indexing machine] participants download 1B vector dataset and store to local disk
    • -
    • [on indexing machine] participants build an index from the 1B vectors and store back to local disk
    • -
    • Stored index is copied to eval machine
    • -
    • [on eval machine] T3 organizers load the index from local disk
    • -
    • [on eval machine] T3 organizers perform searches with held-out query set and measure recall and search time with several sets of parameters.
    • -
    -
  • -
- - T3 will maintain different leaderboards for each dataset based on the following benchmarks: -
    -
  • Recall vs throughput using the same ranking formula as the T1/T2 track
  • -
  • Power- recall vs throughput/watt and a similar ranking formula to the T1/T2 track.
  • -
  • Cost measured as cost/watt (measured as queries/second/watt and MSRP/watt)
  • -
  • Total cost normalized across all tracks.
  • -
- We will provide the exact details on how we collect and compute these benchmarks as well as additional machine and operating system specification before the competition begins. -

-
- -
-

Benchmark Datasets

- We intend to use the following 6 billion point datasets. -
    -
  • BIGANN consists of SIFT descriptors applied to images from extracted from a large image dataset.
  • -
  • Facebook SimSearchNet++ is a new dataset released by Facebook for this competition. - It consists of features used for image copy detection for integrity purposes. - The features are generated by Facebook SimSearchNet++ model.
  • -
  • Microsoft Turing-ANNS-1B is a new dataset being released by the Microsoft Turing team for this competition. - It consists of Bing queries encoded by Turing AGI v5 that trains Transformers to capture similarity of intent in - web search queries. An early version of the RNN-based AGI Encoder is described in a - SIGIR'19 paper and a blogpost.
  • -
  • Microsoft SPACEV-1B is a new web search related dataset - released by Microsoft Bing for this competition. - It consists of document and query vectors encoded by Microsoft SpaceV Superior model to capture generic intent representation.
  • -
  • Yandex DEEP-1B image descriptor dataset consisting of the projected - and normalized outputs from the last fully-connected layer of the GoogLeNet model, which was pretrained on the Imagenet classification task.
  • -
  • Yandex Text-to-Image-1B is a new cross-model dataset (text and visual), - where database and query vectors have different distributions in a shared representation space. The base set consists of Image embeddings produced by the - Se-ResNext-101 model, and queries are textual embeddings produced by a variant of the DSSM model. Since the distributions are different, a 50M sample - of the query distribution is provided.
  • -
- -

- All datasets are in the common binary format that starts with 8 bytes of data consisting of num_points(uint32_t) - num_dimensions(uint32) followed by num_pts X num_dimensions x sizeof(type) bytes of data stored one vector after another. Data files - will have suffixes .fbin, .u8bin, and .i8bin to represent float32, uint8 and int8 type data. Note that a different query set - will be used for evaluation. The details of the datasets along with links to the base, query and sample sets, and the ground truth nearest neighbors - of the query set are listed below. -

- -

- The ground truth binary files for k-NN search consist of the following information: num_queries(uint32_t) - K-NN(uint32) followed by num_queries X K x sizeof(uint32_t) bytes of data representing the IDs of the K-nearest neighbors of the - queries, followed by num_queries X K x sizeof(float) bytes of data representing the distances to the corresponding points. The distances - help identify neighbors tied in terms of distances. In recall calculation, returning a neighbor not in the ground truth set but whose distance is tied - with an entry in the ground truth is counted as success. -

-

- The ground truth binary files for range search consist of the following information: num_queries(int32_t) followed by the total number - of results total_res(int32_t) followed - by num_queries X size(int32_t) bytes corresponding to num_results_per_query for each query, followed by total_res X sizeof(int32_t) - bytes corresponding to the IDs of the neighbors of each query one after the other. -

-

- The ground truth files for the first 10M slice, the first 100M slice, and the complete 1B set of each dataset against the respective query set can be downloaded - here(10M), - here(100M), and - here(1B). -

- - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -
Dataset Datatype Dimensions Distance Range/k-NN Base data Sample data Query data Ground truth Release terms
BIGANN uint8 128 L2 k-NN 1B points 100M base points 10K queries link CC0
Facebook SimSearchNet++* uint8 256 L2 Range 1B points N/A 100k queries link CC BY-NC
Microsoft Turing-ANNS* float32 100 L2 k-NN 1B points N/A 100K queries link link to terms
Microsoft SPACEV* int8 100 L2 k-NN 1B points 100M base points 29.3K queries link O-UDA
Yandex DEEP float32 96 L2 k-NN 1B points 350M base points 10K queries link CC BY 4.0
Yandex Text-to-Image* float32 200 inner-product k-NN 1B points 50M queries 100K queries link CC BY 4.0
- * new datasets
- We recommend using Axel for downloading BIGANN, Facebook-SSN++, Yandex DEEP1B and T2I datasets.
- We recommend using AzCopy for downloading Microsoft datasets. -
- -
-

Metrics

- The competition will measure recall@10 of the algorithms on the 6 data sets a private query set (unreleased) at a fixed query throughput. - Track T1 measures recall of algorithms at 10000 Queries/second (on 32 vCPUs), T2 measures recall at 1500 Queries/second, T2 measures recall at 2000 Queries/second. - The primary metric for comparison in each track will be the sum of improvements in recall over the baseline at the target QPS over all datasets. - Additionally, track T3 will also rank entries by power and cost per query. See this - notebook - for power and cost analysis. - A team has to publish an algorithm and commit to benchmarking on at least 3 datasets to be considered for ranking. Recall regression on a dataset selected - by a team will be continued as a negative score. - The recall@10(AP for SSN++-1B dataset) of the baseline algorithms on each dataset for the public query set is listed below. - - - - - - - - - - - - - - - - - -
Track Algorithm Search MachineTarget Queries/secBIGANN-1B SSN++-1B Turing-ANNS-1B SPACEV-1B DEEP-1B Text-to-Image-1B
Track 1 FAISS-CPU Azure F32s_v2 32vCPUs + 64GB RAM10000 0.634 0.753 0.703 0.728 0.650 0.069
Track 2 DiskANN Azure L8s_v2 8vCPUs + 64GB RAM + 1TB SSD 1500 0.949 0.16274 0.936 0.901 0.937 0.488
Track 3 FAISS-GPU NVIDIA V100 + 700GB RAM2000 0.927 TBA 0.910 0.850 0.942 0.86
-
- -
- Baseline DiskANN indices for T2 can be downloaded using "azcopy copy 'https://comp21storage.blob.core.windows.net/publiccontainer/comp21/diskann-T2-baseline-indices' 'local_folder' --recursive". - Note that this would take some time as the indices are large. All indices were built using R and L parameters set to 100. - Search for T2 used 16 threads and beamwidth 4. The Ls parameter was varied to tune recall vs QPS.
- Update: T2 baseline results have been modified after measuring via pybind11 interface on docker. There was a 30-40% QPS loss using this interface - as compared to direct measurements of C++ code from commandline. As a result, the QPS target has now been lowered, and the recall is reported at this threshold. - - -
-

Call for Participation and Timeline

-

- Participation is open to all teams interested in developing new algorithms or re-implementing - existing algorithms more efficiently either in software or hardware. Participants are - requested to submit a brief document through CMT - for each track they will be competing in. The document should contain the following details: -

    -
  • Name, email and affiliation of each participant in the team
  • -
  • A name and/or URL for the submission.
  • -
  • [Optional] To receive Azure credits for developing new ideas, please submit your request - by June 30th with preliminary data on smaller scale datasets and why you think - your algorithm will work well at billion scale. This will be used by the organizers to select strong - entries. We request teams who already have access to infrastructure (e.g. those from industry or - with access to large university clusters) to skip this.
  • -
- - - For Track T3, the document should contain the following additional details to help organizers plan - and assess eligibility for seperate leaderboards: -
    -
  • Type of hardware, e.g., PCIe extension board, rack-mounted system, or other.
  • -
  • Evidence of the retail MSRP of the hardware, i.e., pricing on website or copy of the customer invoice.
  • -
  • If hardware will be sent to GSI Technology (at the participants expense) or if organizers will given remote access to the systems. - For remote system access participants, whether their system supports standard IPMI power monitoring. - If not IPMI, then an equivalent power monitoring interface must be available. -
  • Operating system requirements.
  • -
  • Whether the participant requires a separate machine for index building. We have limited Azure-based - Fsv2-series machines and some bare-metal machines managed by the T3 organizers.
  • -
-

- -

Consent Forms

- Please review and complete the consent form for participation in Tracks T1/T2 - and Track T3. Note that there are separate consent forms - for the standard and custom hardware tracks. Completing the form is necessary for participation. - -

-

Timeline (subject to change)

-
    -
  • May: release of data, guidelines, and a call for participation. Registration open.
  • -
  • June: Baseline results, testing infrastructure and final ranking metrics released.
  • -
  • July 11th: Participants in need of compute resources to submit an expression of interest.
  • -
  • Mid-July: Allocation of compute resources.
  • -
  • July 30th: Final deadline for participants to submit an expression of interest through CMT.
  • -
  • October 22nd: End of competition period. Teams to release of code in a containerized form, and complete a pull request to the eval framework with code to run the algorithms.
  • -
  • October 29th: Participants submit a brief report outlining their algorithm and results.
  • -
  • Mid-November: Release of preliminary results on standardized machines. Review of code by organizers and participants. Participants can raise concerns about the evaluation.
  • -
  • Early December: Final results published, and competition results archived (the competition will go on if interest continues).
  • -
  • During NeurIPS, organizers will provide an overview of the competition and results. Organizers will also request the best entries - (including leaderboard toppers, or promising new approaches) to present an overview for further discussion.
  • -
-

-
- - -
- - + + + + + + +

You will be redirected to NeurIPS'23 page soon!

+ + \ No newline at end of file diff --git a/install.py b/install.py deleted file mode 100644 index fe212da01..000000000 --- a/install.py +++ /dev/null @@ -1,78 +0,0 @@ -import json -import os -import argparse -import subprocess -from multiprocessing import Pool - - -def build(library, args, dockerfile): - print('Building %s...' % library) - if args is not None and len(args) != 0: - q = " ".join(["--build-arg " + x.replace(" ", "\\ ") for x in args]) - else: - q = "" - - try: - command = 'docker build %s --rm -t billion-scale-benchmark-%s -f' \ - % (q, library ) - command += ' install/Dockerfile.%s .' % (library) \ - if not dockerfile else ' %s .' % dockerfile - subprocess.check_call(command, shell=True) - return {library: 'success'} - except subprocess.CalledProcessError: - return {library: 'fail'} - - -def build_multiprocess(args): - return build(*args) - - -if __name__ == "__main__": - parser = argparse.ArgumentParser( - formatter_class=argparse.ArgumentDefaultsHelpFormatter) - parser.add_argument( - "--proc", - default=1, - type=int, - help="the number of process to build docker images") - parser.add_argument( - '--algorithm', - metavar='NAME', - help='build only the named algorithm image', - default=None) - parser.add_argument( - '--dockerfile', - metavar='PATH', - help='build only the image from a Dockerfile path', - default=None) - parser.add_argument( - '--build-arg', - help='pass given args to all docker builds', - nargs="+") - args = parser.parse_args() - - print('Building base image...') - subprocess.check_call( - 'docker build \ - --rm -t billion-scale-benchmark -f install/Dockerfile .', shell=True) - - if args.dockerfile: - tags = [os.path.basename(os.path.dirname(args.dockerfile))] - elif args.algorithm: - tags = [args.algorithm] - elif os.getenv('LIBRARY'): - tags = [os.getenv('LIBRARY')] - else: - tags = [fn.split('.')[-1] for fn in os.listdir('install') if fn.startswith('Dockerfile.') and not 'faissgpu' in fn] - - print('Building algorithm 
images... with (%d) processes' % args.proc) - - if args.proc == 1: - install_status = [build(tag, args.build_arg, args.dockerfile) for tag in tags ] - else: - pool = Pool(processes=args.proc) - install_status = pool.map(build_multiprocess, [(tag, args.build_arg, args.dockerfile) for tag in tags ]) - pool.close() - pool.join() - - print('\n\nInstall Status:\n' + '\n'.join(str(algo) for algo in install_status)) diff --git a/install/Dockerfile b/install/Dockerfile deleted file mode 100644 index 8b41dd303..000000000 --- a/install/Dockerfile +++ /dev/null @@ -1,13 +0,0 @@ -FROM ubuntu:18.04 - -RUN apt-get update && apt-get install -y python3-numpy python3-scipy python3-pip build-essential git axel wget -RUN wget https://aka.ms/downloadazcopy-v10-linux && mv downloadazcopy-v10-linux azcopy.tgz && tar xzf azcopy.tgz --transform 's!^[^/]\+\($\|/\)!azcopy_folder\1!' -RUN cp azcopy_folder/azcopy /usr/bin - -RUN pip3 install -U pip - -WORKDIR /home/app -COPY requirements.txt run_algorithm.py ./ -RUN pip3 install -r requirements.txt - -ENTRYPOINT ["python3", "-u", "run_algorithm.py"] diff --git a/install/Dockerfile.diskann b/install/Dockerfile.diskann deleted file mode 100644 index 54599646a..000000000 --- a/install/Dockerfile.diskann +++ /dev/null @@ -1,29 +0,0 @@ -FROM billion-scale-benchmark - -RUN apt-get update -RUN apt-get install -y wget git cmake g++ libaio-dev libgoogle-perftools-dev clang-format libboost-dev python3 python3-setuptools python3-pip -RUN pip3 install pybind11 numpy - -RUN cd /tmp && wget https://apt.repos.intel.com/intel-gpg-keys/GPG-PUB-KEY-INTEL-SW-PRODUCTS-2019.PUB -RUN cd /tmp && apt-key add GPG-PUB-KEY-INTEL-SW-PRODUCTS-2019.PUB -RUN cd /tmp && rm GPG-PUB-KEY-INTEL-SW-PRODUCTS-2019.PUB -RUN cd /tmp && sh -c 'echo deb https://apt.repos.intel.com/mkl all main > /etc/apt/sources.list.d/intel-mkl.list' -RUN apt-get update -RUN apt-get install -y intel-mkl-64bit-2020.0-088 - -RUN update-alternatives --install /usr/lib/x86_64-linux-gnu/libblas.so 
libblas.so-x86_64-linux-gnu /opt/intel/mkl/lib/intel64/libmkl_rt.so 150 -RUN update-alternatives --install /usr/lib/x86_64-linux-gnu/libblas.so.3 libblas.so.3-x86_64-linux-gnu /opt/intel/mkl/lib/intel64/libmkl_rt.so 150 -RUN update-alternatives --install /usr/lib/x86_64-linux-gnu/liblapack.so liblapack.so-x86_64-linux-gnu /opt/intel/mkl/lib/intel64/libmkl_rt.so 150 -RUN update-alternatives --install /usr/lib/x86_64-linux-gnu/liblapack.so.3 liblapack.so.3-x86_64-linux-gnu /opt/intel/mkl/lib/intel64/libmkl_rt.so 150 - -RUN echo "/opt/intel/lib/intel64" > /etc/ld.so.conf.d/mkl.conf -RUN echo "/opt/intel/mkl/lib/intel64" >> /etc/ld.so.conf.d/mkl.conf -RUN ldconfig -RUN echo "MKL_THREADING_LAYER=GNU" >> /etc/environment - -RUN git clone --single-branch --branch python_bindings_diskann https://github.com/microsoft/diskann -RUN mkdir -p diskann/build -RUN cd diskann/build && cmake -DCMAKE_BUILD_TYPE=Release .. -RUN cd diskann/build && make -j -RUN cd diskann/python && pip install -e . -RUN python3 -c 'import diskannpy' diff --git a/install/Dockerfile.elastiknn b/install/Dockerfile.elastiknn deleted file mode 100644 index e69de29bb..000000000 diff --git a/install/Dockerfile.faiss b/install/Dockerfile.faiss deleted file mode 100644 index 191966ab6..000000000 --- a/install/Dockerfile.faiss +++ /dev/null @@ -1,9 +0,0 @@ -FROM billion-scale-benchmark - -RUN apt-get update && apt-get install -y libopenblas-base libopenblas-dev libpython3-dev swig python3-dev libssl-dev wget -RUN wget https://github.com/Kitware/CMake/releases/download/v3.18.3/cmake-3.18.3-Linux-x86_64.sh && mkdir cmake && sh cmake-3.18.3-Linux-x86_64.sh --skip-license --prefix=cmake && rm cmake-3.18.3-Linux-x86_64.sh -RUN git clone https://github.com/facebookresearch/faiss lib-faiss -RUN cd lib-faiss && ../cmake/bin/cmake -DFAISS_OPT_LEVEL=avx2 -DCMAKE_BUILD_TYPE=Release -DFAISS_ENABLE_GPU=OFF -DPython_EXECUTABLE=/usr/bin/python3 -B build . 
-RUN cd lib-faiss && make -C build -j4 -RUN cd lib-faiss && cd build && cd faiss && cd python && python3 setup.py install && cd && rm -rf cmake -RUN python3 -c 'import faiss; print(faiss.IndexFlatL2)' diff --git a/install/Dockerfile.faissconda b/install/Dockerfile.faissconda deleted file mode 100644 index 914fd0649..000000000 --- a/install/Dockerfile.faissconda +++ /dev/null @@ -1,17 +0,0 @@ -FROM billion-scale-benchmark - -RUN apt update && apt install -y wget -RUN wget https://repo.anaconda.com/archive/Anaconda3-2020.11-Linux-x86_64.sh -RUN bash Anaconda3-2020.11-Linux-x86_64.sh -b - -ENV PATH /root/anaconda3/bin:$PATH - -RUN conda install -c pytorch faiss-cpu -COPY install/requirements_conda.txt ./ -# conda doesn't like some of our packages, use pip -RUN python3 -m pip install -r requirements_conda.txt - -RUN python3 -c 'import faiss; print(faiss.IndexFlatL2)' - - - diff --git a/install/Dockerfile.httpann_example b/install/Dockerfile.httpann_example deleted file mode 100644 index 4b36efd6b..000000000 --- a/install/Dockerfile.httpann_example +++ /dev/null @@ -1,3 +0,0 @@ -FROM billion-scale-benchmark - -RUN python3 -m pip install flask==2.0.1 diff --git a/install/requirements_conda.txt b/install/requirements_conda.txt deleted file mode 100644 index c902620f5..000000000 --- a/install/requirements_conda.txt +++ /dev/null @@ -1,11 +0,0 @@ -ansicolors -docker-py -h5py -matplotlib -numpy -pyyaml -psutil -scipy -scikit-learn -jinja2 -pandas diff --git a/logging.conf b/logging.conf deleted file mode 100644 index 6a4595f12..000000000 --- a/logging.conf +++ /dev/null @@ -1,34 +0,0 @@ -[loggers] -keys=root,annb - -[handlers] -keys=consoleHandler,fileHandler - -[formatters] -keys=simpleFormatter - -[formatter_simpleFormatter] -format=%(asctime)s - %(name)s - %(levelname)s - %(message)s -datefmt= - -[handler_consoleHandler] -class=StreamHandler -level=INFO -formatter=simpleFormatter -args=(sys.stdout,) - -[handler_fileHandler] -class=FileHandler -level=INFO 
-formatter=simpleFormatter -args=('annb.log','w') - -[logger_root] -level=WARN -handlers=consoleHandler - -[logger_annb] -level=INFO -handlers=consoleHandler,fileHandler -qualname=annb -propagate=0 diff --git a/neurips21.html b/neurips21.html new file mode 100644 index 000000000..d2c6b4d9a --- /dev/null +++ b/neurips21.html @@ -0,0 +1,552 @@ + + + + + + + + Big ANN Benchmarks + + + + + + + + + + + + + + + +
+

Billion-Scale Approximate Nearest Neighbor Search Challenge: NeurIPS'21 competition track

+ +

+ + + + +

Code, Report, Results and Blogs

+ + + +
+

Why this competition?

+ In the past few years, we’ve seen a lot of new research and creative approaches for large-scale ANNS, including: +
    +
  • Partition-based, and graph-based indexing strategies (as well as hybrid indexing approaches).
  • +
  • Mixing RAM and SSD storage to efficiently store and process large datasets that exceed the size of RAM.
  • +
  • Using accelerator hardware such as GPUs, FPGAs, and other custom in-memory silicon.
  • +
  • Leveraging machine learning for dimensionality reduction of the original vectors.
  • +
+

+ In addition to an uptick in academic interest, many implementations of these algorithms at scale now appear in production + and high availability datacenter contexts: powering enterprise-grade, mission-critical, and web-scale search applications. + In these deployment scenarios, benchmarks such as cost, preprocessing time, and power consumption become just as important as + the recall-vs-latency tradeoff. Despite this, most empirical evaluations of algorithms have focused on smaller datasets + of about a million points, e.g. ann-benchmarks.com. However, deploying recent algorithmic advances in ANNS techniques for + search, recommendation and ranking at scale requires support at billion or substantially larger scale. Barring a few recent + papers, there is limited consensus on which algorithms are effective at this scale. +

+ + We believe that this challenge will be impactful in several ways: +
    +
  • Provide a comparative understanding of algorithmic ideas and their application at scale.
  • +
  • Promote the development of new techniques for the problem and demonstration of their value.
  • +
  • Provide a compilation of datasets, many new, to enable future development of algorithms.
  • +
  • Introduce a standard benchmarking approach.
  • +
+ By providing a platform for those interested in this problem, we aim to encourage more collaboration and collectively advance the field at a more rapid pace. + Researchers can request Azure compute credit from a pool sponsored by Microsoft Research. +
+ +
+

Tracks

+

Standard Hardware Tracks (T1 and T2)

+

+ There are two standard hardware tracks: +

    +
  • Track 1: In-memory indices with FAISS as the baseline. + Search would use Azure Standard_F32s_v2 VMs + with 32 vCPUs and 64GB RAM. Index construction would use Azure + Standard_F64s_v2 VM + with 64vCPUs, 128GB RAM and an additional 4TB of SSD to be used for storing the data, index and other intermediate data.
  • +
  • Track 2: Out-of-core indices with DiskANN as the baseline. + In addition to the limited DRAM in T1, index can use an SSD for search. + Search would use Azure + Standard_L8s_v2 VMs with 8 vCPUS, 64GB RAM and a local SSD Index constrained to 1TB. + Construction would use Azure + Standard_F64s_v2 VM + with 64vCPU, 128GB RAM and an additional 4TB of SSD to be used for storing the data, index and other intermediate data.
  • +
+ Participants are expected to release their code for index building and search which the organizers will run on separate machines. + Participants provide a configuration for their index build code that would complete in 4 days for each dataset. + The protocol for evaluation is as follows: +
    +
  • [on indexing machine] participants will be given a local path with 1B vector dataset.
  • +
  • [on indexing machine] participants build an index from the 1B vectors and store back to local disk.
  • +
  • [on indexing machine] Stored index is copied out to a temporary cloud storage location by the eval framework.
  • +
  • [on search machine] organizers load the index from cloud storage to a local path and provide the path to the search code.
  • +
  • [on search machine] organizers perform searches with held-out query set and measure recall and time to process the queries with several sets of parameters.
  • +
+

+ + Finalized details for build and search hardware timing will be released along with the eval framework. + +

Custom Hardware Track (T3)

+

+ Participants can use non-standard hardware such as GPUs, AI accelerators, FPGAs, and custom in-memory silicon. + In this track, participants will either 1) send their hardware, such as PCI boards to GSI Technology or 2) evaluate + themselves using the scripts made available by the organizers. For T3 participants sending hardware, + we will make specific delivery arrangements at participant’s expense. We will install the hardware on a system under + the organizers control (we have a few bare-metal options available) and follow any installation directions provided. + Participants will be allowed to temporarily log into the machine to finalize any installation and configuration, + or for debugging installation as needed. For T3 participants running the evaluation themselves, we request remote ssh + access and sudo accounts on the systems so that the organizers can verify the system and hardware (such as IPMI support, + minimum resource availability such as disk storage for datasets). + + The evaluation phase will proceed like T1/T2, with a few modifications. +

    +
  • For participants that send their hardware, T3 organizers will provide remote access to a separate indexing machine. +
      +
    • [on separate indexing machine] participants download 1B vector dataset and store to local disk
    • +
    • [on separate indexing machine] participants build an index from the 1B vectors and store back to local disk
    • +
    • Stored index is copied to eval machine
    • +
    • [on eval machine] T3 organizers load the index from local disk
    • +
    • [on eval machine] T3 organizers provide index with held-out query set and measure recall and time to process the queries with several sets of parameters. + Index search code can use internal parallelism to batch process the queries.
    • +
    +
  • +
  • For participants that give us remote access to systems, participants are responsible for building their index. +
      +
    • [on indexing machine] participants download 1B vector dataset and store to local disk
    • +
    • [on indexing machine] participants build an index from the 1B vectors and store back to local disk
    • +
    • Stored index is copied to eval machine
    • +
    • [on eval machine] T3 organizers load the index from local disk
    • +
    • [on eval machine] T3 organizers perform searches with held-out query set and measure recall and search time with several sets of parameters.
    • +
    +
  • +
+ + T3 will maintain different leaderboards for each dataset based on the following benchmarks: +
    +
  • Recall vs throughput using the same ranking formula as the T1/T2 track
  • +
  • Power- recall vs throughput/watt and a similar ranking formula to the T1/T2 track.
  • +
  • Cost measured as cost/watt (measured as queries/second/watt and MSRP/watt)
  • +
  • Total cost normalized across all tracks.
  • +
+ We will provide the exact details on how we collect and compute these benchmarks as well as additional machine and operating system specification before the competition begins. +

+
+ +
+

Benchmark Datasets

+ We intend to use the following 6 billion point datasets. +
    +
  • BIGANN consists of SIFT descriptors applied to images extracted from a large image dataset.
  • +
  • Facebook SimSearchNet++ is a new dataset released by Facebook for this competition. + It consists of features used for image copy detection for integrity purposes. + The features are generated by Facebook SimSearchNet++ model.
  • +
  • Microsoft Turing-ANNS-1B is a new dataset being released by the Microsoft Turing team for this competition. + It consists of Bing queries encoded by Turing AGI v5 that trains Transformers to capture similarity of intent in + web search queries. An early version of the RNN-based AGI Encoder is described in a + SIGIR'19 paper and a blogpost.
  • +
  • Microsoft SPACEV-1B is a new web search related dataset + released by Microsoft Bing for this competition. + It consists of document and query vectors encoded by Microsoft SpaceV Superior model to capture generic intent representation.
  • +
  • Yandex DEEP-1B image descriptor dataset consisting of the projected + and normalized outputs from the last fully-connected layer of the GoogLeNet model, which was pretrained on the Imagenet classification task.
  • +
  • Yandex Text-to-Image-1B is a new cross-modal dataset (text and visual), + where database and query vectors have different distributions in a shared representation space. The base set consists of Image embeddings produced by the + Se-ResNext-101 model, and queries are textual embeddings produced by a variant of the DSSM model. Since the distributions are different, a 50M sample + of the query distribution is provided.
  • +
+ +

+ All datasets are in the common binary format that starts with 8 bytes of data consisting of num_points(uint32_t) + num_dimensions(uint32) followed by num_pts X num_dimensions x sizeof(type) bytes of data stored one vector after another. Data files + will have suffixes .fbin, .u8bin, and .i8bin to represent float32, uint8 and int8 type data. Note that a different query set + will be used for evaluation. The details of the datasets along with links to the base, query and sample sets, and the ground truth nearest neighbors + of the query set are listed below. +

+ +

+ The ground truth binary files for k-NN search consist of the following information: num_queries(uint32_t) + K-NN(uint32) followed by num_queries X K x sizeof(uint32_t) bytes of data representing the IDs of the K-nearest neighbors of the + queries, followed by num_queries X K x sizeof(float) bytes of data representing the distances to the corresponding points. The distances + help identify neighbors tied in terms of distances. In recall calculation, returning a neighbor not in the ground truth set but whose distance is tied + with an entry in the ground truth is counted as success. +

+

+ The ground truth binary files for range search consist of the following information: num_queries(int32_t) followed by the total number + of results total_res(int32_t) followed + by num_queries X sizeof(int32_t) bytes corresponding to num_results_per_query for each query, followed by total_res X sizeof(int32_t) + bytes corresponding to the IDs of the neighbors of each query one after the other. +

+

+ The ground truth files for the first 10M slice, the first 100M slice, and the complete 1B set of each dataset against the respective query set can be downloaded + here(10M), + here(100M), and + here(1B). +

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
Dataset Datatype Dimensions Distance Range/k-NN Base data Sample data Query data Ground truth Release terms
BIGANN uint8 128 L2 k-NN 1B points 100M base points 10K queries link CC0
Facebook SimSearchNet++* uint8 256 L2 Range 1B points N/A 100k queries link CC BY-NC
Microsoft Turing-ANNS* float32 100 L2 k-NN 1B points N/A 100K queries link link to terms
Microsoft SPACEV* int8 100 L2 k-NN 1B points 100M base points 29.3K queries link O-UDA
Yandex DEEP float32 96 L2 k-NN 1B points 350M base points 10K queries link CC BY 4.0
Yandex Text-to-Image* float32 200 inner-product k-NN 1B points 50M queries 100K queries link CC BY 4.0
+ * new datasets
+ We recommend using Axel for downloading BIGANN, Facebook-SSN++, Yandex DEEP1B and T2I datasets.
+ We recommend using AzCopy for downloading Microsoft datasets. +
+ +
+

Metrics

+ The competition will measure recall@10 of the algorithms on the 6 data sets using a private query set (unreleased) at a fixed query throughput. + Track T1 measures recall of algorithms at 10000 Queries/second (on 32 vCPUs), T2 measures recall at 1500 Queries/second, T3 measures recall at 2000 Queries/second. + The primary metric for comparison in each track will be the sum of improvements in recall over the baseline at the target QPS over all datasets. + Additionally, track T3 will also rank entries by power and cost per query. See this + notebook + for power and cost analysis. + A team has to publish an algorithm and commit to benchmarking on at least 3 datasets to be considered for ranking. Recall regression on a dataset selected + by a team will be counted as a negative score. + The recall@10(AP for SSN++-1B dataset) of the baseline algorithms on each dataset for the public query set is listed below. + + + + + + + + + + + + + + + + + +
Track Algorithm Search MachineTarget Queries/secBIGANN-1B SSN++-1B Turing-ANNS-1B SPACEV-1B DEEP-1B Text-to-Image-1B
Track 1 FAISS-CPU Azure F32s_v2 32vCPUs + 64GB RAM10000 0.634 0.753 0.703 0.728 0.650 0.069
Track 2 DiskANN Azure L8s_v2 8vCPUs + 64GB RAM + 1TB SSD 1500 0.949 0.16274 0.936 0.901 0.937 0.488
Track 3 FAISS-GPU NVIDIA V100 + 700GB RAM2000 0.927 TBA 0.910 0.850 0.942 0.86
+
+ +
+ Baseline DiskANN indices for T2 can be downloaded using "azcopy copy 'https://comp21storage.blob.core.windows.net/publiccontainer/comp21/diskann-T2-baseline-indices' 'local_folder' --recursive". + Note that this would take some time as the indices are large. All indices were built using R and L parameters set to 100. + Search for T2 used 16 threads and beamwidth 4. The Ls parameter was varied to tune recall vs QPS.
+ Update: T2 baseline results have been modified after measuring via pybind11 interface on docker. There was a 30-40% QPS loss using this interface + as compared to direct measurements of C++ code from commandline. As a result, the QPS target has now been lowered, and the recall is reported at this threshold. + + +
+

Call for Participation and Timeline

+

+ Participation is open to all teams interested in developing new algorithms or re-implementing + existing algorithms more efficiently either in software or hardware. Participants are + requested to submit a brief document through CMT + for each track they will be competing in. The document should contain the following details: +

    +
  • Name, email and affiliation of each participant in the team
  • +
  • A name and/or URL for the submission.
  • +
  • [Optional] To receive Azure credits for developing new ideas, please submit your request + by June 30th with preliminary data on smaller scale datasets and why you think + your algorithm will work well at billion scale. This will be used by the organizers to select strong + entries. We request teams who already have access to infrastructure (e.g. those from industry or + with access to large university clusters) to skip this.
  • +
+ + + For Track T3, the document should contain the following additional details to help organizers plan + and assess eligibility for separate leaderboards: +
    +
  • Type of hardware, e.g., PCIe extension board, rack-mounted system, or other.
  • +
  • Evidence of the retail MSRP of the hardware, i.e., pricing on website or copy of the customer invoice.
  • +
  • If hardware will be sent to GSI Technology (at the participant's expense) or if organizers will be given remote access to the systems. + For remote system access participants, whether their system supports standard IPMI power monitoring. + If not IPMI, then an equivalent power monitoring interface must be available. +
  • Operating system requirements.
  • +
  • Whether the participant requires a separate machine for index building. We have limited Azure-based + Fsv2-series machines and some bare-metal machines managed by the T3 organizers.
  • +
+

+ +

Consent Forms

+ Please review and complete the consent form for participation in Tracks T1/T2 + and Track T3. Note that there are separate consent forms + for the standard and custom hardware tracks. Completing the form is necessary for participation. + +

+

Timeline (subject to change)

+
    +
  • May: release of data, guidelines, and a call for participation. Registration open.
  • +
  • June: Baseline results, testing infrastructure and final ranking metrics released.
  • +
  • July 11th: Participants in need of compute resources to submit an expression of interest.
  • +
  • Mid-July: Allocation of compute resources.
  • +
  • July 30th: Final deadline for participants to submit an expression of interest through CMT.
  • +
  • October 22nd: End of competition period. Teams to release code in a containerized form, and complete a pull request to the eval framework with code to run the algorithms.
  • +
  • October 29th: Participants submit a brief report outlining their algorithm and results.
  • +
  • Mid-November: Release of preliminary results on standardized machines. Review of code by organizers and participants. Participants can raise concerns about the evaluation.
  • +
  • Early December: Final results published, and competition results archived (the competition will go on if interest continues).
  • +
  • During NeurIPS, organizers will provide an overview of the competition and results. Organizers will also request the best entries + (including leaderboard toppers, or promising new approaches) to present an overview for further discussion.
  • +
+

+
+ + +
+

Summary of NeurIPS'21 event

+ The NeurIPS session for this competition happened on Dec 8, 2021. See slides and recordings of the talks below. + Overview Talk and Break-out session schedule (GMT). +
    +
  • 11:05-11:25: Overview Talk (slides, video)
  • +
  • 12:00-12:45: Overview of results presented by organizers, followed by Q&A
  • +
      +
    • Standard hardware tracks T1 and T2 results (slides)
    • +
    • Custom hardware track T3 results (slides)
    • +
    +
  • 12:45-13:20: Invited talk 1 by Prof. Alexandr Andoni: Learning to Hash Robustly, with Guarantees (slides, video)
  • +
  • 13:20-13:55: Invited talk 2 by Prof. Anshumali Shrivastava: Iterative Repartitioning for Learning to Hash and the Power of k-Choices (slides, video)
  • +
  • 13:55-14:30: Talks from track winners. +
      +
    • Track 1: kst_ann_t1 Li Liu, Jin Yu, Guohao Dai, Wei Wu, Yu Qiao, Yu Wang, Lingzhi Liu, Kuaishou Technology and Tsinghua University (video)
    • +
    • Track 2: BBANN Xiaomeng Yi, Xiaofan Luan, Weizhi Xu, Qianya Cheng, Jigao Luo, Xiangyu Wang, Jiquan Long, Xiao Yan, Zheng Bian, Jiarui Luo, Shengjun Li, Chengming Li, Zilliz and Southern University of Science and Technology (slides, video)
    • +
    • Track 3: OptaNNe Sourabh Dongaonkar, Mark Hildebrand, Mariano Tepper, Cecilia Aguerrebere, Ted Willke, Jawad Khan, Intel Corporation, Intel Labs and UC Davis (slides, video)
    • +
    +
  • +
  • 14:30-15:00: Open discussion on competition and future directions (github thread, video)
  • +
+

+ Abstract for Invited talk: "Learning to Hash Robustly, with Guarantees"
+ There is a gap between the high-dimensional nearest neighbor search + (NNS) algorithms achieving the best worst-case guarantees and the + top-performing ones in practice. The former are based on indexing via + the randomized Locality Sensitive Hashing (LSH), and its + derivatives. The latter "learn" the best indexing method in order to + speed-up NNS, crucially adapting to the structure of the given + dataset. Alas, the latter also almost always come at the cost of + losing the guarantees of either correctness or robust performance on + adversarial queries (or apply to datasets with an assumed extra + structure/model). + + How can we bridge these two perspectives and bring the best of both + worlds? As a step in this direction, we will talk about an NNS algorithm + that has worst-case guarantees essentially matching that of + theoretical algorithms, while optimizing the hashing to the structure + of the dataset (think instance-optimal algorithms) for performance on + the minimum-performing query. We will discuss the algorithm's ability + to optimize for a given dataset from both theoretical and practical + perspective. +

+ +

+ Abstract for Invited talk: "Iterative Repartitioning for Learning to Hash and the Power of k-Choices"
+ Dense embedding models are commonly deployed in commercial + search engines, wherein all the vectors are pre-computed, and + near-neighbor search (NNS) is performed with the query vector to find + relevant documents. However, the bottleneck of indexing a large number + of dense vectors and performing an NNS hurts the query time and + accuracy of these models. In this talk, we argue that high-dimensional + and ultra-sparse embedding is a significantly superior alternative to + dense low-dimensional embedding for both query efficiency and + accuracy. Extreme sparsity eliminates the need for NNS by replacing + them with simple lookups, while its high dimensionality ensures that + the embeddings are informative even when sparse. However, learning + extremely high dimensional embeddings leads to blow-up in the model + size. To make the training feasible, we propose a partitioning + algorithm that learns such high-dimensional embeddings across multiple + GPUs without any communication. We theoretically prove that our way of + one-sided learning is equivalent to learning both query and label + embeddings. We call our novel system designed on sparse embeddings as + IRLI (pronounced `early'), which iteratively partitions the items by + learning the relevant buckets directly from the query-item relevance + data. Furthermore, IRLI employs a superior power-of-k-choices based + load balancing strategy. We mathematically show that IRLI retrieves + the correct item with high probability under very natural assumptions + and provides superior load balancing. IRLI surpasses the best + baseline's precision on multi-label classification while being 5x + faster on inference. For near-neighbor search tasks, the same method + outperforms the state-of-the-art Learned Hashing approach NeuralLSH by + requiring only ~ {1/6}^th of the candidates for the same recall. IRLI + is both data and model parallel, making it ideal for distributed GPU + implementation. 
We demonstrate this advantage by indexing 100 million + dense vectors and surpassing the popular FAISS library by >10%. +

+
+ + + +
+ + diff --git a/neurips23.html b/neurips23.html new file mode 100644 index 000000000..0265b2f76 --- /dev/null +++ b/neurips23.html @@ -0,0 +1,630 @@ + + + + + + + + + + + + NeurIPS'23 Competition Track: Big-ANN + + + + + + + + + + +
+ +
+ + +
+ +
+
+
+ + +

+ NeurIPS'23 Competition Track: + Big-ANN +

+
+ +

+ Supported by + + + + +

+ +
+

+ New: the latest ongoing leaderboard has been released (March 1st, 2024).
Top entries:
+

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
Filter trackOOD trackSparse track
RankAlgorithmQPS@90% recallRankAlgorithmQPS@90% recallRankAlgorithmQPS@90% recall
1Pinecone-filter85,4911Pinecone-ood38,0881Zilliz10,749
2Zilliz84,5962Zilliz33,2412Pinecone_smips10,440
3ParlayANN IVF237,9023RoarANN22,5553PyANNS8,732
4Puck19,1934PyANNS22,2964shnsw7,137
... ... ... ... ... ... ... ... ...
BaselineFAISS3,032BaselineDiskann4,133BaselineLinscan93
+

+ Note: entries by Pinecone and Zilliz are not open source. +
+

+

+
+ + +

+ This challenge is to encourage the development of indexing data + structures and search algorithms for practical variants of + the Approximate Nearest Neighbor (ANN) or Vector search problem. + These variants are increasingly relevant as vector search becomes commonplace. + This challenge has four tracks covering sparse, + filtered, out-of-distribution and streaming variants of ANNS. These + variants require adapted search algorithms and strategies with + different tradeoffs. Participants are encouraged to develop and + submit new algorithms that improve on the baselines for these + variants. This competition aims at being accessible to participants + by limiting the scale of the datasets to about 10 million points. +

+ + + + + + + + + + + + + + +
+
+ + + +
+
+
+

+ Tracks: Datasets, Metrics and Baselines +

+ +

+ The evaluation hardware is normalized to Azure Standard D8lds v5 + (8 vCPUs and 16GB DRAM). The index build time on this machine + will be limited to 12 hours, + except for streaming index which has stricter time limits. +

+

+ The challenge consists of 4 tracks with separate leaderboards and + participants can choose to submit entries to one or more tracks: +

+
+ +
    +
  • + Filtered Search: This task will use a random 10M slice of the YFCC + 100M dataset transformed with CLIP embeddings. In addition, we + associate with each image a "bag" of tags: words extracted from + the description, the camera model, the year the picture was taken + and the country. The tags are from a vocabulary of 200386 possible + tags. The 100,000 queries consist of one image embedding and one + or two tags that must appear in the database elements to be + considered. +
  • +
  • + Out-Of-Distribution: This task will use the Yandex Text-to-Image + 10M, cross-modal dataset where the database and query index have + different distributions in the shared vector space. The base set + is a 10M subset of the Yandex visual search database of + 200-dimensional image embeddings which are produced with the + Se-ResNext-101 model. The query embeddings correspond to the + user-specified textual search queries. The text embeddings are + extracted with a variant of the DSSM model. +
  • +
  • + Sparse: This task is based on the common MSMARCO passage retrieval + dataset, which has 8,841,823 text passages, encoded into sparse + vectors using the SPLADE model. The vectors have a large dimension + (about 30,000), but each vector in the base dataset has an average + of approximately 120 nonzero elements. The query set contains + 6,980 text queries, embedded by the same SPLADE model. The average + number of nonzero elements in the query set is approximately 49 + (since text queries are generally shorter). Given a sparse query + vector, the index should return the top-k results according to the + maximal inner product between the vectors. +
  • +
  • + Streaming Search: This task uses a 30M slice of the MS Turing data + set released in the previous challenge. The index starts with zero + points and must implement the "runbook" provided -- a sequence of + insertion, deletion, and search operations (roughly 4:4:1 ratio) -- + within a time bound of 1 hour and 8GB DRAM. The intention + is for the algorithm to process the operations and maintain a compact + index over the active points rather than index the entire anticipated + set of points and use tombstones or flags to mark active elements. + More details to come. The runbook is provided in `final_runbook.yaml` + which is generated with `final_runbook_gen.py`. +
  • +
+ +
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
TrackDatasetDimensionsData typeBaseline algoQPS @ 90% recallRelease terms
FilteredYFCC-10M + CLIP192uint8filter-FAISS3200 + CC BY 4.0 +
OODText2Image-10M200float32diskann4882 + CC BY 4.0 +
SparseMS MARCO / SPLADE~30Kfloat32, sparse formatLinscan101 + MS-MARCO: + Free NC
+ SPLADE: + CC BY NC SA +
StreamingMSTuring-30M-clustered100float32fresh-diskann0.883 recall@10 (45mins) + O-UDA +
+
+ + + We recommend using Axel for downloading + non-Microsoft + datasets. We recommend using AzCopy for + downloading + Microsoft datasets. + +
+
+ + + + +
+
+
+

Track Winners and Presentations

+
+ +

Filtered Search

+
    +
  • + ParlayANN IVF2: + Fusing Classic and Spatial Inverted Indices for Fast Filtered ANNS + [slides] + Authors: Ben Landrum (UMD), Magdalen Dobson Manohar (CMU), Mazin Karjikar (UMD), Laxman Dhulipala (UMD) +
  • +
+ +

Out-Of-Distribution

+
    +
  • + RoarANN: Projected Bipartite Graph for Efficient Cross-Modal Approximate Nearest Neighbor Search + Authors: Meng Chen, Yue Chen, Rui Ma, Kai Zhang, Yuzheng Cai, Jiayang Shi, Yizhuo Chen, Weiguo Zheng. All authors from Fudan University. +
  • + +
  • + PyANNS + Authors: Zihao Wang, Shanghai Jiao Tong University* +
  • +
+ +

Sparse

+
    +
  • + PyANNS + Authors: Zihao Wang, Shanghai Jiao Tong University* +
  • +
  • + GrassRMA: GRAph-based Sparse Vector Search with Reducing Memory Accesses
    + Authors: Meng Chen, Yue Chen, Rui Ma, Kai Zhang, Yuzheng Cai, Jiayang Shi, Yizhuo Chen, Weiguo Zheng. All authors from Fudan University. +
  • +
+ +

Streaming Search

+
    +
  • + Puck: + Efficient Multi-level Index Structure for Approximate Nearest Neighbor Search in Practice + [slides] + Authors: Jie Yin, Ben Huang, Baidu. +
  • +
+

+ * Zihao Wang is also an employee of Zilliz. However, he declares that the PyANNS entry was created on his time off, without any involvement from Zilliz or any of the other organizers. This entry did not declare conflict with organizers before participating. + +

Organizer Presentations

+ + + +

Invited Talks

+ + +
+
+ + +
+
+

Participation

+ + +
+

Guidelines

+ +
    +
  • + To participate, please express + interest through the CMT portal. +
  • +
  • + To request cloud compute credits + ($1000) towards development, please select the "Requesting cloud + credit" field in your CMT entry and share a brief overview of + the ideas you plan to develop with these credits in your CMT + entry. +
  • + +
  • + To get started, please see the + instructions in the README + file, and submit a Pull Request + corresponding to your algorithm(s). +
  • + +
  • + For questions and discussions, please + use the Github issues or the Discord channel. +
  • +
+
+ + +
+

Timeline (subject to change)

+ +
    +
  • + June: Baseline results, testing + infrastructure, CFP and final ranking metrics released. +
  • +
  • + August 30th (previously End-July): Suggested deadline for requesting allocation of cloud + compute credits for development. Credits will be provided on an ongoing basis. +
  • +
  • + September 15th (previously August 30th): Final deadline for + participants to submit an expression of interest through CMT. +
  • +
  • + October 30th: End of competition + period. Teams to release code in a containerized form, and + complete a pull request to the eval framework with code to run + the algorithms. +
  • +
  • + Mid-November: Release of preliminary + results on standardized machines. Review of code by organizers + and participants. Participants can raise concerns about the + evaluation. +
  • +
  • + Early December: Final results + published, and competition results archived (the competition + will go on if interest continues). +
  • +
  • + During NeurIPS: Organizers will + provide an overview of the competition and results. Organizers + will also request the best entries (including leaderboard + toppers, or promising new approaches) to present an overview for + further discussion. +
  • +
+
+
+
+ + +
+
+
+

Organizers and Dataset Contributors

+ +

+ Organizers can be reached at + big-ann-organizers@googlegroups.com. We thank + Microsoft Research, Meta, Pinecone, Yandex, and Zilliz + for help in preparing and organizing this competition. We thank + Microsoft for cloud credits towards running the competition, + and AWS and Pinecone for compute credits for participants. +

+
+ + + +

+ Supported by + + + +

+
+
+
+ + + + + + diff --git a/neurips23_slides/ANNS_for_recommendation_systems_Yury.pdf b/neurips23_slides/ANNS_for_recommendation_systems_Yury.pdf new file mode 100644 index 000000000..0335d9021 Binary files /dev/null and b/neurips23_slides/ANNS_for_recommendation_systems_Yury.pdf differ diff --git a/neurips23_slides/IVF_2_filter_Ben.pdf b/neurips23_slides/IVF_2_filter_Ben.pdf new file mode 100644 index 000000000..b3c7321e3 Binary files /dev/null and b/neurips23_slides/IVF_2_filter_Ben.pdf differ diff --git a/neurips23_slides/NVIDIA_Corey.pdf b/neurips23_slides/NVIDIA_Corey.pdf new file mode 100644 index 000000000..d834238e8 Binary files /dev/null and b/neurips23_slides/NVIDIA_Corey.pdf differ diff --git a/neurips23_slides/intro.pptx b/neurips23_slides/intro.pptx new file mode 100644 index 000000000..98b7909a7 Binary files /dev/null and b/neurips23_slides/intro.pptx differ diff --git a/neurips23_slides/streaming_puck_baidu.pptx b/neurips23_slides/streaming_puck_baidu.pptx new file mode 100644 index 000000000..7d77a2748 Binary files /dev/null and b/neurips23_slides/streaming_puck_baidu.pptx differ diff --git a/neurips23_slides/summary.pdf b/neurips23_slides/summary.pdf new file mode 100644 index 000000000..1864f5bf8 Binary files /dev/null and b/neurips23_slides/summary.pdf differ diff --git a/notebooks/check_1B_groundtruth.ipynb b/notebooks/check_1B_groundtruth.ipynb deleted file mode 100644 index 497f7dbd6..000000000 --- a/notebooks/check_1B_groundtruth.ipynb +++ /dev/null @@ -1,365 +0,0 @@ -{ - "cells": [ - { - "cell_type": "code", - "execution_count": 1, - "id": "4011807d", - "metadata": {}, - "outputs": [], - "source": [ - "import sys\n", - "import numpy as np" - ] - }, - { - "cell_type": "code", - "execution_count": 2, - "id": "45df07dc", - "metadata": {}, - "outputs": [], - "source": [ - "sys.path.append(\"..\")\n", - "from benchmark import datasets" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "a4d10abc", - "metadata": {}, - "outputs": 
[], - "source": [] - }, - { - "cell_type": "code", - "execution_count": 6, - "id": "0d64ca07", - "metadata": {}, - "outputs": [], - "source": [ - "# the ground-truth files on https://big-ann-benchmarks.com/\n", - "\n", - "\n", - "new_gt = {\n", - " 'bigann-1B': \"https://comp21storage.blob.core.windows.net/publiccontainer/comp21/bigann/public_query_gt100.bin\", \n", - " \"ssnpp-1B\": \"https://dl.fbaipublicfiles.com/billion-scale-ann-benchmarks/FB_ssnpp_public_queries_GT.rangeres\",\n", - " 'msturing-1B': \"https://comp21storage.blob.core.windows.net/publiccontainer/comp21/MSFT-TURING-ANNS/query_gt100.bin\",\n", - " \"msspacev-1B\": \"https://comp21storage.blob.core.windows.net/publiccontainer/comp21/spacev1b/public_query_gt100.bin\", \n", - " \"deep-1B\": \"https://storage.yandexcloud.net/yandex-research/ann-datasets/deep_new_groundtruth.public.10K.bin\", \n", - " \"text2image-1B\": \"https://storage.yandexcloud.net/yandex-research/ann-datasets/t2i_new_groundtruth.public.100K.bin\",\n", - "}\n" - ] - }, - { - "cell_type": "code", - "execution_count": 22, - "id": "4dd26410", - "metadata": {}, - "outputs": [ - { - "name": "stdout", - "output_type": "stream", - "text": [ - "Dataset BigANNDataset in dimension 128, with distance euclidean, search_type knn, size: Q 10000 B 1000000000\n", - "Dataset SSNPPDataset in dimension 256, with distance euclidean, search_type range, size: Q 100000 B 1000000000\n", - "Dataset MSTuringANNS in dimension 100, with distance euclidean, search_type knn, size: Q 100000 B 1000000000\n", - "Dataset MSSPACEV1B in dimension 100, with distance euclidean, search_type knn, size: Q 29316 B 1000000000\n", - "Dataset Deep1BDataset in dimension 96, with distance euclidean, search_type knn, size: Q 10000 B 1000000000\n", - "Dataset Text2Image1B in dimension 200, with distance ip, search_type knn, size: Q 100000 B 1000000000\n" - ] - } - ], - "source": [ - "# get official GT file \n", - "\n", - "\n", - "for dsname in new_gt: \n", - " ds = 
datasets.DATASETS[dsname]()\n", - " print(ds)\n", - " \n", - " data = urllib.request.urlopen(new_gt[dsname]).read()\n", - " open(f\"/tmp/new_GT/{dsname}\", \"wb\").write(data)\n", - " \n", - " " - ] - }, - { - "cell_type": "code", - "execution_count": 109, - "id": "c0c2545b", - "metadata": {}, - "outputs": [], - "source": [ - "def count_diff_1_result(Dref, Iref, Dnew, Inew, eps): \n", - " \"\"\" compare knn search results. Intended to normalize for: \n", - " - small variations of the distance measure (below eps)\n", - " - ordering of ties\n", - " \"\"\"\n", - " if not np.all(Dref == Dnew): \n", - " assert np.abs(Dref - Dnew).max() < eps\n", - " # attempt to do some normalization to merge nearby distances \n", - " Dref = np.floor(np.minimum(Dref, Dnew) / eps) * eps \n", - " \n", - " ndiff = 0\n", - " cur_d = -1e10\n", - " s_ref = set()\n", - " s_new = set()\n", - " for j in range(len(Iref)): \n", - " if Dref[j] != cur_d: \n", - " nd = len(s_ref ^ s_new)\n", - " ndiff += nd\n", - " if nd > 0: \n", - " pass\n", - " # print(i, cur_d, s_ref, s_new)\n", - " s_ref = set()\n", - " s_new = set()\n", - " cur_d = Dref[j]\n", - " s_ref.add(Iref[j])\n", - " s_new.add(Inew[j]) \n", - " return ndiff\n", - "\n", - "def compare_knn_res(Dref, Iref, Dnew, Inew): \n", - "\n", - " ndiff = 0\n", - " eps = Dref.max() * 1e-5\n", - " for i in range(len(Iref)):\n", - " \n", - " if np.all(Iref[i] == Inew[i]): \n", - " continue\n", - " \n", - " ndiff += count_diff_1_result(Dref[i], Iref[i], Dnew[i], Inew[i], eps)\n", - " \n", - "\n", - " return ndiff" - ] - }, - { - "cell_type": "code", - "execution_count": 110, - "id": "af4affa2", - "metadata": { - "scrolled": false - }, - "outputs": [ - { - "name": "stdout", - "output_type": "stream", - "text": [ - "bigann-1B Dataset BigANNDataset in dimension 128, with distance euclidean, search_type knn, size: Q 10000 B 1000000000\n", - "raw_diff=0.9899 % diff=0.0 %\n", - "(10000, 100) (10000, 100)\n", - "ssnpp-1B Dataset SSNPPDataset in dimension 256, 
with distance euclidean, search_type range, size: Q 100000 B 1000000000\n", - "(7706752,) (7706752,)\n", - "msturing-1B Dataset MSTuringANNS in dimension 100, with distance euclidean, search_type knn, size: Q 100000 B 1000000000\n", - "raw_diff=0.0195 % diff=0.00024 %\n", - "(100000, 100) (100000, 100)\n", - "msspacev-1B Dataset MSSPACEV1B in dimension 100, with distance euclidean, search_type knn, size: Q 29316 B 1000000000\n", - "raw_diff=24.181163869559285 % diff=0.0 %\n", - "(29316, 100) (29316, 100)\n", - "deep-1B Dataset Deep1BDataset in dimension 96, with distance euclidean, search_type knn, size: Q 10000 B 1000000000\n", - "raw_diff=0.1864 % diff=0.0002 %\n", - "(10000, 100) (10000, 100)\n", - "text2image-1B Dataset Text2Image1B in dimension 200, with distance ip, search_type knn, size: Q 100000 B 1000000000\n", - "raw_diff=0.04773 % diff=0.0 %\n", - "(100000, 100) (100000, 100)\n" - ] - } - ], - "source": [ - "# compare with what I computed \n", - "new_basedir = \"/checkpoint/matthijs/billion-scale-ann-benchmarks/GT_1B/\"\n", - "\n", - "for dsname in new_gt: \n", - " ds = datasets.DATASETS[dsname]()\n", - " print(dsname, ds)\n", - " if ds.search_type() == \"knn\": \n", - " Iref, Dref = datasets.knn_result_read(f\"/tmp/new_GT/{dsname}\")\n", - " Inew, Dnew = datasets.knn_result_read(f\"{new_basedir}/{dsname}\")\n", - " raw_ndiff = (Iref != Inew).sum()\n", - " ndiff = compare_knn_res(Dref, Iref, Dnew, Inew) \n", - " print(f\"raw_diff={100 * raw_ndiff/ Iref.size} % diff={100 * ndiff/ Iref.size} %\")\n", - " \n", - " else: \n", - " nres_ref, Iref, Dref = datasets.range_result_read(f\"/tmp/new_GT/{dsname}\")\n", - " nres_new, Inew, Dnew = datasets.range_result_read(f\"{new_basedir}/{dsname}\")\n", - " # does not make much sense to verify, they are computed simultaneously\n", - " \n", - " print(Iref.shape, Inew.shape)\n", - " \n", - " \n", - " " - ] - }, - { - "cell_type": "markdown", - "id": "8b100230", - "metadata": {}, - "source": [ - "# Check subsets -- 
range" - ] - }, - { - "cell_type": "markdown", - "id": "a069dc1d", - "metadata": {}, - "source": [ - "Make sure the 10M and 100M results are a subset of 1B" - ] - }, - { - "cell_type": "code", - "execution_count": 91, - "id": "fd4bebff", - "metadata": {}, - "outputs": [], - "source": [ - "dsname = \"ssnpp-1B\"" - ] - }, - { - "cell_type": "code", - "execution_count": 92, - "id": "1ba55156", - "metadata": {}, - "outputs": [], - "source": [ - "new_basedir = \"/checkpoint/matthijs/billion-scale-ann-benchmarks/GT_1B/\"\n", - "\n", - "nres_ref, Iref, Dref = datasets.range_result_read(f\"/tmp/new_GT/{dsname}\")\n", - "nres_new, Inew, Dnew = datasets.range_result_read(f\"{new_basedir}/{dsname}\")" - ] - }, - { - "cell_type": "code", - "execution_count": 98, - "id": "2f570eb7", - "metadata": {}, - "outputs": [], - "source": [ - "for nb, ss in [(10 ** 7, \"10M\"), (10 ** 8, \"100M\")]: \n", - " ds_sub = dsname.replace(\"1B\", ss)\n", - " nres_sub, Isub, Dsub = datasets.range_result_read(f\"/checkpoint/matthijs/billion-scale-ann-benchmarks/GT_{ss}/{ds_sub}\")\n", - " \n", - " nq = len(nres_ref)\n", - " assert len(nres_sub) == nq\n", - " i0 = j0 = 0\n", - " for i in range(nq): \n", - " i1 = i0 + nres_ref[i]\n", - " j1 = j0 + nres_sub[i]\n", - "\n", - " ref_res = Iref[i0:i1]\n", - " sub_res = Isub[j0:j1]\n", - "\n", - " ref_res_sub = ref_res[ref_res < nb]\n", - " assert set(ref_res_sub) == set(sub_res)\n", - "\n", - " i0 = i1\n", - " j0 = j1\n", - " " - ] - }, - { - "cell_type": "markdown", - "id": "eed490b8", - "metadata": {}, - "source": [ - "# Check subsets -- knn" - ] - }, - { - "cell_type": "markdown", - "id": "b4b5f7a9", - "metadata": {}, - "source": [ - "Make sure the 10M and 100M results are a subset of 1B in knn sense " - ] - }, - { - "cell_type": "code", - "execution_count": 118, - "id": "7d846214", - "metadata": {}, - "outputs": [ - { - "name": "stdout", - "output_type": "stream", - "text": [ - "bigann-1B\n", - "10M diff=0.0 % (verif on 10175 / 1000000 = 1/98.3)\n", 
- "100M diff=0.0 % (verif on 99455 / 1000000 = 1/10.1)\n", - "msturing-1B\n", - "10M diff=0.0 % (verif on 99896 / 10000000 = 1/100.1)\n", - "100M diff=0.0 % (verif on 1000758 / 10000000 = 1/10.0)\n", - "msspacev-1B\n", - "10M diff=0.0 % (verif on 30801 / 2931600 = 1/95.2)\n", - "100M diff=0.0 % (verif on 293540 / 2931600 = 1/10.0)\n", - "deep-1B\n", - "10M diff=0.0 % (verif on 10285 / 1000000 = 1/97.2)\n", - "100M diff=0.0 % (verif on 100663 / 1000000 = 1/9.9)\n", - "text2image-1B\n", - "10M diff=0.0 % (verif on 99944 / 10000000 = 1/100.1)\n", - "100M diff=0.0 % (verif on 999862 / 10000000 = 1/10.0)\n" - ] - } - ], - "source": [ - "basedir = \"/checkpoint/matthijs/billion-scale-ann-benchmarks/GT\"\n", - "\n", - "for dsname in new_gt: \n", - " if dsname == \"ssnpp-1B\": \n", - " continue\n", - " print(dsname)\n", - " I1B, D1B = datasets.knn_result_read(f\"{basedir}_1B/{dsname}\")\n", - " nq = len(I1B)\n", - " ndiff = 0\n", - " eps = D1B.max() * 1e-5\n", - " \n", - " for nb, ss in [(10 ** 7, \"10M\"), (10 ** 8, \"100M\")]: \n", - " ds_sub = dsname.replace(\"1B\", ss)\n", - " Iss, Dss = datasets.knn_result_read(f\"{basedir}_{ss}/{ds_sub}\")\n", - " ndiff = 0\n", - " ltot = 0\n", - " \n", - " for i in range(nq): \n", - " ref_I = I1B[i][I1B[i] < nb]\n", - " ref_D = D1B[i][I1B[i] < nb]\n", - " \n", - " l = len(ref_I)\n", - " ndiff += count_diff_1_result(ref_D, ref_I, Dss[i, :l], Iss[i, :l], eps)\n", - " ltot += l\n", - " \n", - " print(f\"{ss} diff={100 * ndiff / ltot} % (verif on {ltot} / {I1B.size} = 1/{I1B.size/ltot:.1f})\")\n", - " " - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "b704d902", - "metadata": {}, - "outputs": [], - "source": [] - } - ], - "metadata": { - "kernelspec": { - "display_name": "Python 3", - "language": "python", - "name": "python3" - }, - "language_info": { - "codemirror_mode": { - "name": "ipython", - "version": 3 - }, - "file_extension": ".py", - "mimetype": "text/x-python", - "name": "python", - "nbconvert_exporter": 
"python", - "pygments_lexer": "ipython3", - "version": "3.8.10" - } - }, - "nbformat": 4, - "nbformat_minor": 5 -} diff --git a/notebooks/compare_track1_1B_vs_2x500M.ipynb b/notebooks/compare_track1_1B_vs_2x500M.ipynb deleted file mode 100644 index 861626598..000000000 --- a/notebooks/compare_track1_1B_vs_2x500M.ipynb +++ /dev/null @@ -1,155 +0,0 @@ -{ - "cells": [ - { - "cell_type": "code", - "execution_count": 1, - "id": "b07b0a31", - "metadata": {}, - "outputs": [], - "source": [ - "import numpy as np\n", - "from matplotlib import pyplot" - ] - }, - { - "cell_type": "code", - "execution_count": 22, - "id": "9342ed00", - "metadata": {}, - "outputs": [], - "source": [ - "%matplotlib inline\n", - "%config InlineBackend.figure_format='retina'" - ] - }, - { - "cell_type": "code", - "execution_count": 23, - "id": "7e597ea8", - "metadata": {}, - "outputs": [], - "source": [ - "import sys\n", - "sys.path.append('../')\n", - "\n", - "from track1_baseline_faiss.parse_results import parse_result_file, find_latest_version" - ] - }, - { - "cell_type": "markdown", - "id": "702544bb", - "metadata": {}, - "source": [ - "# with run logs" - ] - }, - { - "cell_type": "markdown", - "id": "db0a4a75", - "metadata": {}, - "source": [ - "Here we compare the QPS for the single machine with 1B vectors setting and the 2 machines with 500M setting." - ] - }, - { - "cell_type": "code", - "execution_count": 54, - "id": "00be8b94", - "metadata": {}, - "outputs": [ - { - "data": { - "image/png": "\n", - "text/plain": [ - "
" - ] - }, - "metadata": { - "image/png": { - "height": 440, - "width": 666 - }, - "needs_background": "light" - }, - "output_type": "display_data" - } - ], - "source": [ - "di = 0\n", - "pyplot.gcf().set_size_inches(11, 7)\n", - "for dsname in \"bigann-1B deep-1B msspacev-1B msturing-1B\".split():\n", - " \n", - " di += 1\n", - " pyplot.subplot(2, 2, di)\n", - " \n", - " # the PQ 4-bit code does not expose enough statistics to do this computation\n", - " for t in \"PQ8bit\", : # \"PQ4bit\": \n", - " \n", - " suf = \"PQ64\" if t == \"PQ8bit\" else \"PQ128x4fsr\"\n", - " \n", - " indexkey, res, keys, stats = parse_result_file(find_latest_version(\n", - " f\"../logs/{dsname}.IVF1M_2level_{suf}.b.log\"))\n", - "\n", - " r10 = res[:, 0]\n", - "\n", - " # simulate QPS w/ 2 shards \n", - " t_per_q = res[:, 1]\n", - " # coarse quantization time\n", - " quant_time = t_per_q * res[:, 3] / 100 \n", - " # half the time to scan inverted lists \n", - " simulated_t = (t_per_q - quant_time) * 0.5 + quant_time\n", - "\n", - " qps = 1000 / simulated_t \n", - "\n", - " pyplot.semilogy(r10, qps, label=\"2x500M, 64 bytes \")\n", - "\n", - " suf = \"PQ32\" if t == \"PQ8bit\" else \"PQ64x4fsr\"\n", - " indexkey, res, keys, stats = parse_result_file(find_latest_version(\n", - " f\"../logs/{dsname}.IVF1M_2level_{suf}.b.log\"))\n", - " \n", - " r10 = res[:, 0]\n", - " # * 2 = we have two machines\n", - " qps = 1000 / res[:, 1] * 2\n", - "\n", - " pyplot.semilogy(r10, qps, label=\"1x1B, 32 bytes\")\n", - "\n", - " pyplot.title(dsname)\n", - " if di >=3: \n", - " pyplot.xlabel(\"inter @ 10\")\n", - " pyplot.ylabel(\"QPS\")\n", - " pyplot.legend()\n", - " pyplot.grid()\n", - " # pyplot.show()" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "e22b90ec", - "metadata": {}, - "outputs": [], - "source": [] - } - ], - "metadata": { - "kernelspec": { - "display_name": "Python 3", - "language": "python", - "name": "python3" - }, - "language_info": { - "codemirror_mode": { - 
"name": "ipython", - "version": 3 - }, - "file_extension": ".py", - "mimetype": "text/x-python", - "name": "python", - "nbconvert_exporter": "python", - "pygments_lexer": "ipython3", - "version": "3.8.10" - } - }, - "nbformat": 4, - "nbformat_minor": 5 -} diff --git a/notebooks/eval_t2i_results.ipynb b/notebooks/eval_t2i_results.ipynb deleted file mode 100644 index ef293ad6c..000000000 --- a/notebooks/eval_t2i_results.ipynb +++ /dev/null @@ -1,234 +0,0 @@ -{ - "cells": [ - { - "cell_type": "code", - "execution_count": 1, - "id": "936ec4fe", - "metadata": {}, - "outputs": [], - "source": [ - "import numpy as np\n", - "from matplotlib import pyplot" - ] - }, - { - "cell_type": "code", - "execution_count": 2, - "id": "00d04ee8", - "metadata": {}, - "outputs": [], - "source": [ - "%matplotlib inline\n", - "%config InlineBackend.figure_format='retina'" - ] - }, - { - "cell_type": "code", - "execution_count": 3, - "id": "8499fc2c", - "metadata": {}, - "outputs": [], - "source": [ - "import sys\n", - "sys.path.append('../')\n", - "\n", - "from track1_baseline_faiss.parse_results import parse_result_file, find_latest_version" - ] - }, - { - "cell_type": "code", - "execution_count": 4, - "id": "38e8d46b", - "metadata": {}, - "outputs": [], - "source": [ - "dsname = \"text2image-10M\"" - ] - }, - { - "cell_type": "markdown", - "id": "3820d8b4", - "metadata": {}, - "source": [ - "# Results on IVFFlat indexes\n", - "\n", - "This is to see how it performs without compression." - ] - }, - { - "cell_type": "code", - "execution_count": 5, - "id": "ef3aa64a", - "metadata": {}, - "outputs": [ - { - "data": { - "image/png": "\n", - "text/plain": [ - "
" - ] - }, - "metadata": { - "image/png": { - "height": 261, - "width": 387 - }, - "needs_background": "light" - }, - "output_type": "display_data" - } - ], - "source": [ - "for key in \"IVF16k\", \"IVF16k_HNSW\", \"IVF16k_2level\", \"IVF16k_2level_HNSW\": \n", - " \n", - "\n", - " indexkey, res, keys, stats = parse_result_file(find_latest_version(\n", - " f\"../logs/{dsname}.{key}.b.log\"))\n", - " \n", - " if res.size == 0: \n", - " print(\"skip\", key)\n", - " continue\n", - " \n", - " r10 = res[:, 0]\n", - " qps = 1000 / res[:, 1]\n", - " \n", - " pyplot.semilogy(r10, qps, label=key)\n", - "\n", - "\n", - "pyplot.xlabel(\"inter @ 10\")\n", - "pyplot.ylabel(\"QPS\")\n", - "pyplot.legend()\n", - "pyplot.grid()" - ] - }, - { - "cell_type": "markdown", - "id": "140cd7a7", - "metadata": {}, - "source": [ - "It performs pretty well, even in combination with HNSW and 2-level encoding. \n", - "\n", - "# Compression \n", - "\n", - "Here we fix the coarse quantizer and evaluate compression options" - ] - }, - { - "cell_type": "code", - "execution_count": 13, - "id": "f01c7309", - "metadata": {}, - "outputs": [ - { - "name": "stdout", - "output_type": "stream", - "text": [ - "IVF16k\n", - "IVF16k,PQ48\n", - "IVF16k,PQ64\n", - "IVF16k,RR192_PQ32\n", - "IVF16k,SQ4\n", - "IVF16k,SQ4_PCAR100\n", - "IVF16k,SQ6\n", - "IVF16k,SQ6_nores\n", - "skip IVF16k,SQ6_nores\n", - "IVF16k,SQ8\n", - "IVF16k,SQ8_PQ32\n", - "IVF16k,SQ8_PQ32_nores\n", - "skip IVF16k,SQ8_PQ32_nores\n", - "IVF16k,SQ8_nores\n", - "skip IVF16k,SQ8_nores\n" - ] - }, - { - "data": { - "image/png": "\n", - "text/plain": [ - "
" - ] - }, - "metadata": { - "image/png": { - "height": 440, - "width": 666 - }, - "needs_background": "light" - }, - "output_type": "display_data" - } - ], - "source": [ - "allkeys=\"\"\"\n", - "IVF16k IVF16k,SQ8 IVF16k,SQ8_nores \n", - "IVF16k,SQ6 IVF16k,SQ6_nores \n", - "IVF16k,SQ8_PQ32 IVF16k,SQ8_PQ32_nores \n", - "IVF16k,SQ4 IVF16k,SQ4_PCAR100 \n", - "IVF16k,RR192_PQ32 IVF16k,PQ64 IVF16k,PQ48\"\"\"\n", - "\n", - "for key in sorted(allkeys.split()): \n", - " print(key)\n", - " indexkey, res, keys, stats = parse_result_file(find_latest_version(\n", - " f\"../logs/{dsname}.{key}.b.log\"))\n", - " \n", - " if res.size == 0 or \"nores\" in key: \n", - " print(\"skip\", key)\n", - " continue\n", - " \n", - " r10 = res[:, 0]\n", - " qps = 1000 / res[:, 1]\n", - " \n", - " pyplot.semilogy(\n", - " r10, qps, \n", - " 'o-' if \"PQ\" in key else \n", - " \"+-\" if \"SQ\" in key else \"-\", \n", - " label=indexkey or key)\n", - "\n", - "pyplot.title(dsname)\n", - "pyplot.xlabel(\"inter @ 10\")\n", - "pyplot.ylabel(\"QPS\")\n", - "pyplot.legend()\n", - "pyplot.grid()\n", - "pyplot.gcf().set_size_inches(11, 7)" - ] - }, - { - "cell_type": "code", - "execution_count": 26, - "id": "c4edbd1f", - "metadata": {}, - "outputs": [], - "source": [ - "indexkey" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "5e103039", - "metadata": {}, - "outputs": [], - "source": [] - } - ], - "metadata": { - "kernelspec": { - "display_name": "Python 3", - "language": "python", - "name": "python3" - }, - "language_info": { - "codemirror_mode": { - "name": "ipython", - "version": 3 - }, - "file_extension": ".py", - "mimetype": "text/x-python", - "name": "python", - "nbconvert_exporter": "python", - "pygments_lexer": "ipython3", - "version": "3.8.10" - } - }, - "nbformat": 4, - "nbformat_minor": 5 -} diff --git a/notebooks/find_suitable_nq.ipynb b/notebooks/find_suitable_nq.ipynb deleted file mode 100644 index 80d465dff..000000000 --- a/notebooks/find_suitable_nq.ipynb +++ 
/dev/null @@ -1,323 +0,0 @@ -{ - "cells": [ - { - "cell_type": "markdown", - "id": "sealed-vertical", - "metadata": {}, - "source": [ - "The purpose of this notebook is to evaluate how many query vectors (nq) we need \n", - "to get an accurate estimate of the intersection @ 10 measure. \n" - ] - }, - { - "cell_type": "code", - "execution_count": 55, - "id": "hairy-relaxation", - "metadata": {}, - "outputs": [], - "source": [ - "import numpy as np\n", - "import faiss\n", - "from faiss.contrib import datasets\n", - "from matplotlib import pyplot" - ] - }, - { - "cell_type": "code", - "execution_count": 69, - "id": "emotional-filter", - "metadata": {}, - "outputs": [], - "source": [ - "# start with BigANN 10M\n", - "\n", - "ds = datasets.DatasetBigANN(10)" - ] - }, - { - "cell_type": "code", - "execution_count": 5, - "id": "alpha-webcam", - "metadata": {}, - "outputs": [], - "source": [ - "# we need more query vectors than the usual 10k, so pick them from the training set\n", - "\n", - "xtt = ds.get_train(maxtrain=2 * 10**6)\n", - "\n", - "big_xq = xtt[:10**6] # 1M queries \n", - "xt = xtt[10**6:] # 1M training vectors" - ] - }, - { - "cell_type": "markdown", - "id": "imported-variance", - "metadata": {}, - "source": [ - "# Ground truth" - ] - }, - { - "cell_type": "code", - "execution_count": 18, - "id": "adequate-jefferson", - "metadata": {}, - "outputs": [], - "source": [ - "index = faiss.IndexFlatL2(128)\n", - "index.add(ds.get_database())" - ] - }, - { - "cell_type": "code", - "execution_count": 19, - "id": "minus-defendant", - "metadata": {}, - "outputs": [], - "source": [ - "index = faiss.index_cpu_to_all_gpus(index, ngpu=1)" - ] - }, - { - "cell_type": "code", - "execution_count": 20, - "id": "trying-andorra", - "metadata": {}, - "outputs": [ - { - "name": "stdout", - "output_type": "stream", - "text": [ - "CPU times: user 4min 59s, sys: 2min 8s, total: 7min 8s\n", - "Wall time: 7min 8s\n" - ] - } - ], - "source": [ - "%%time\n", - "Dgt, Igt = 
index.search(big_xq, 10)" - ] - }, - { - "cell_type": "code", - "execution_count": 21, - "id": "maritime-oriental", - "metadata": {}, - "outputs": [], - "source": [ - "np.save(\"/tmp/Dgt.npy\", Dgt)\n", - "np.save(\"/tmp/Igt.npy\", Igt)" - ] - }, - { - "cell_type": "markdown", - "id": "supreme-jewel", - "metadata": {}, - "source": [ - "# With some index" - ] - }, - { - "cell_type": "code", - "execution_count": 27, - "id": "comic-therapy", - "metadata": {}, - "outputs": [], - "source": [ - "# we pick some index that has one search-time parameter \n", - "# to represent different speed-accuracy tradeoffs.\n", - "\n", - "index = faiss.index_factory(128, \"IVF16384,SQ4\")\n", - "index = faiss.index_cpu_to_all_gpus(index, ngpu=1)\n", - "\n", - "index.train(xt)\n", - "\n", - "index.add(ds.get_database())" - ] - }, - { - "cell_type": "code", - "execution_count": 48, - "id": "perfect-associate", - "metadata": {}, - "outputs": [ - { - "name": "stdout", - "output_type": "stream", - "text": [ - "1\n", - "4\n", - "16\n", - "64\n" - ] - } - ], - "source": [ - "# run queries \n", - "\n", - "res_per_nprobe = {}\n", - "for nprobe in 1, 4, 16, 64:\n", - " print(nprobe)\n", - " D, I = [], []\n", - " index.nprobe = nprobe\n", - " # Faiss crashes when searching all at once\n", - " for i0 in range(0, 10**6, 10000): \n", - " Di, Ii = index.search(big_xq[i0 : i0 + 10000], 10)\n", - " D.append(Di)\n", - " I.append(Ii)\n", - " D = np.vstack(D)\n", - " I = np.vstack(I)\n", - " res_per_nprobe[nprobe] = I" - ] - }, - { - "cell_type": "markdown", - "id": "novel-yukon", - "metadata": {}, - "source": [ - "# Stats on intersection measure" - ] - }, - { - "cell_type": "code", - "execution_count": 70, - "id": "polish-sheep", - "metadata": {}, - "outputs": [ - { - "name": "stdout", - "output_type": "stream", - "text": [ - "nprobe 1 inter 25.914 %\n", - "nprobe 4 inter 49.756 %\n", - "nprobe 16 inter 68.647 %\n", - "nprobe 64 inter 77.002 %\n" - ] - } - ], - "source": [ - "# evaluate intersection 
measures for the 1M queries\n", - "\n", - "for nprobe in 1, 4, 16, 64: \n", - " I = res_per_nprobe[nprobe]\n", - " ninter = faiss.eval_intersection(I, Igt)\n", - " print(f\"nprobe {nprobe:-5d} inter {100 * ninter/I.size:.3f} %\")" - ] - }, - { - "cell_type": "code", - "execution_count": 60, - "id": "consistent-service", - "metadata": {}, - "outputs": [ - { - "data": { - "image/png": "\n", - "text/plain": [ - "
" - ] - }, - "metadata": { - "needs_background": "light" - }, - "output_type": "display_data" - } - ], - "source": [ - "# collect per-query intersections\n", - "\n", - "all_ninters = {}\n", - "for nprobe in 1, 4, 16, 64: \n", - " I = res_per_nprobe[nprobe] \n", - " ninters = [\n", - " faiss.eval_intersection(I[i0 : i0 + 1], Igt[i0 : i0 + 1])\n", - " for i0 in range(10**6)\n", - " ]\n", - " all_ninters[nprobe] = ninters\n", - " pyplot.plot(np.bincount(ninters), 'o-', label=f\"nprobe {nprobe}\")\n", - "pyplot.xlabel(\"nb intersections\")\n", - "pyplot.ylabel(\"nb queries\")\n", - "pyplot.legend()\n", - "pyplot.grid() \n" - ] - }, - { - "cell_type": "code", - "execution_count": 68, - "id": "unavailable-forward", - "metadata": {}, - "outputs": [ - { - "name": "stdout", - "output_type": "stream", - "text": [ - "nprobe 1\n", - "n= 1000 stddev 0.705 %\n", - "n= 10000 stddev 0.223 %\n", - "n= 100000 stddev 0.071 %\n", - "n=1000000 stddev 0.022 %\n", - "nprobe 4\n", - "n= 1000 stddev 0.727 %\n", - "n= 10000 stddev 0.230 %\n", - "n= 100000 stddev 0.073 %\n", - "n=1000000 stddev 0.023 %\n", - "nprobe 16\n", - "n= 1000 stddev 0.525 %\n", - "n= 10000 stddev 0.166 %\n", - "n= 100000 stddev 0.053 %\n", - "n=1000000 stddev 0.017 %\n", - "nprobe 64\n", - "n= 1000 stddev 0.382 %\n", - "n= 10000 stddev 0.121 %\n", - "n= 100000 stddev 0.038 %\n", - "n=1000000 stddev 0.012 %\n" - ] - } - ], - "source": [ - "# do some math to compute standard deviations\n", - "\n", - "for nprobe in 1, 4, 16, 64: \n", - " intersection_measures = np.array(all_ninters[nprobe]) / 10 \n", - " variance = intersection_measures.var()\n", - " print(\"nprobe\", nprobe)\n", - " for n in 10**3, 10**4, 10**5, 10**6: \n", - " # sum of independent variables\n", - " # https://en.wikipedia.org/wiki/Variance#Sum_of_uncorrelated_variables_.28Bienaym.C3.A9_formula.29\n", - " variance_of_sum = n * variance\n", - " variance_of_mean = variance_of_sum * (1 / n) ** 2\n", - " sttdev_of_mean = np.sqrt(variance_of_mean)\n", - " 
print(f\"n={n:-7} stddev {100*sttdev_of_mean:.3f} % (percentage points)\")" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "realistic-guinea", - "metadata": {}, - "outputs": [], - "source": [] - } - ], - "metadata": { - "kernelspec": { - "display_name": "Python 3", - "language": "python", - "name": "python3" - }, - "language_info": { - "codemirror_mode": { - "name": "ipython", - "version": 3 - }, - "file_extension": ".py", - "mimetype": "text/x-python", - "name": "python", - "nbconvert_exporter": "python", - "pygments_lexer": "ipython3", - "version": "3.7.9" - } - }, - "nbformat": 4, - "nbformat_minor": 5 -} diff --git a/notebooks/large_coarse_quantizer.ipynb b/notebooks/large_coarse_quantizer.ipynb deleted file mode 100644 index ecccd1401..000000000 --- a/notebooks/large_coarse_quantizer.ipynb +++ /dev/null @@ -1,586 +0,0 @@ -{ - "cells": [ - { - "cell_type": "markdown", - "id": "9f85f826", - "metadata": {}, - "source": [ - "It is useful to cluster the 1B datasets to around 262k - 1M clusters for IVF indexing with Faiss.\n", - "However, it is not feasible to do the clustering within the allocated time for indexing. 
\n", - "\n", - "Therefore, here we evaluate other options to break down the clustering cost, while getting the same number of clusters.\n", - "The model that we use is: Deep1M (1M database vectors), 4096 clusters (which conveniently breaks down to 2^6 * 2^6)\n" - ] - }, - { - "cell_type": "code", - "execution_count": 1, - "id": "ongoing-first", - "metadata": {}, - "outputs": [], - "source": [ - "import numpy as np\n", - "import faiss\n", - "from faiss.contrib import datasets" - ] - }, - { - "cell_type": "code", - "execution_count": 3, - "id": "finnish-giant", - "metadata": {}, - "outputs": [], - "source": [ - "ds = datasets.DatasetDeep1B(10**6)" - ] - }, - { - "cell_type": "code", - "execution_count": 4, - "id": "satisfied-adoption", - "metadata": {}, - "outputs": [], - "source": [ - "xt = ds.get_train(10**5)\n", - "d = ds.d\n", - "xb = ds.get_database()\n", - "xq = ds.get_queries()\n", - "gt = ds.get_groundtruth()\n" - ] - }, - { - "cell_type": "code", - "execution_count": 5, - "id": "genetic-sleep", - "metadata": {}, - "outputs": [], - "source": [ - "sqrt_nlist = 64\n", - "nlist = sqrt_nlist**2" - ] - }, - { - "cell_type": "markdown", - "id": "indoor-client", - "metadata": {}, - "source": [ - "# Flat quantizer" - ] - }, - { - "cell_type": "markdown", - "id": "1a18ca10", - "metadata": {}, - "source": [ - "Flat quantizer is what we would like to apprach, but it probably too costly. \n", - "We include it here as a topline.\n", - "The measure we use is recall of nearest neighbor vs. number of computed distances." 
- ] - }, - { - "cell_type": "code", - "execution_count": 22, - "id": "romance-pacific", - "metadata": {}, - "outputs": [], - "source": [ - "quantizer = faiss.IndexFlatL2(d)\n", - "index = faiss.IndexIVFFlat(quantizer, d, nlist)" - ] - }, - { - "cell_type": "code", - "execution_count": 23, - "id": "noble-possession", - "metadata": {}, - "outputs": [ - { - "data": { - "text/plain": [ - "1.431187283968" - ] - }, - "execution_count": 23, - "metadata": {}, - "output_type": "execute_result" - } - ], - "source": [ - "index.train(xt)\n", - "index.add(xb)\n", - "index.invlists.imbalance_factor()" - ] - }, - { - "cell_type": "code", - "execution_count": 24, - "id": "described-chicago", - "metadata": {}, - "outputs": [ - { - "name": "stdout", - "output_type": "stream", - "text": [ - "nprobe=1 1-recall @ 1: 0.3745 dis/q=349.15\n", - "nprobe=4 1-recall @ 1: 0.6849 dis/q=1344.67\n", - "nprobe=16 1-recall @ 1: 0.9004 dis/q=5040.35\n", - "nprobe=64 1-recall @ 1: 0.9793 dis/q=18331.49\n" - ] - } - ], - "source": [ - "stats = faiss.cvar.indexIVF_stats\n", - "for nprobe in 1, 4, 16, 64: \n", - " index.nprobe = nprobe \n", - " stats.reset()\n", - " D, I = index.search(xq, 100)\n", - " rank = 1\n", - " recall = (I[:, :rank] == gt[:, :1]).sum() / len(xq)\n", - " print(f\"nprobe={nprobe} 1-recall @ {rank}: {recall} dis/q={stats.ndis/len(xq):.2f}\")" - ] - }, - { - "cell_type": "markdown", - "id": "realistic-valve", - "metadata": {}, - "source": [ - "# IMI quantizer" - ] - }, - { - "cell_type": "markdown", - "id": "c0388876", - "metadata": {}, - "source": [ - "The IMI quantizer is a cheap way of breaking down the dataset into buckets. It is a PQ2x6 and each PQ code ends in a separate bucket. 
" - ] - }, - { - "cell_type": "code", - "execution_count": 25, - "id": "amateur-earth", - "metadata": {}, - "outputs": [], - "source": [ - "quantizer = faiss.MultiIndexQuantizer(d, 2, int(np.log2(sqrt_nlist)))" - ] - }, - { - "cell_type": "code", - "execution_count": 26, - "id": "unsigned-motorcycle", - "metadata": {}, - "outputs": [], - "source": [ - "index = faiss.IndexIVFFlat(quantizer, d, nlist)\n", - "index.quantizer_trains_alone = 1" - ] - }, - { - "cell_type": "code", - "execution_count": 27, - "id": "organizational-impossible", - "metadata": {}, - "outputs": [ - { - "data": { - "text/plain": [ - "16.421237645312" - ] - }, - "execution_count": 27, - "metadata": {}, - "output_type": "execute_result" - } - ], - "source": [ - "index.train(xt)\n", - "index.add(xb)\n", - "index.invlists.imbalance_factor()\n" - ] - }, - { - "cell_type": "code", - "execution_count": 28, - "id": "7be36ece", - "metadata": {}, - "outputs": [ - { - "name": "stdout", - "output_type": "stream", - "text": [ - "nprobe=1 1-recall @ 1: 0.437 dis/q=3972.32\n", - "nprobe=4 1-recall @ 1: 0.6948 dis/q=9210.20\n", - "nprobe=16 1-recall @ 1: 0.8656 dis/q=19246.74\n", - "nprobe=64 1-recall @ 1: 0.9613 dis/q=41114.89\n" - ] - } - ], - "source": [ - "stats = faiss.cvar.indexIVF_stats\n", - "\n", - "for nprobe in 1, 4, 16, 64: \n", - " index.nprobe = nprobe \n", - " stats.reset()\n", - "\n", - " D, I = index.search(xq, 100)\n", - " rank = 1\n", - " recall = (I[:, :rank] == gt[:, :1]).sum() / len(xq)\n", - " print(f\"nprobe={nprobe} 1-recall @ {rank}: {recall} dis/q={stats.ndis/len(xq):.2f}\")" - ] - }, - { - "cell_type": "markdown", - "id": "cc986a53", - "metadata": {}, - "source": [ - "So way less efficient than the flat quantizer, due to imbalanced inverted lists. TBH, the IMI quantizer usually sets a cap on the number of distances rather than fixing the number of visited buckets. 
" - ] - }, - { - "cell_type": "markdown", - "id": "south-differential", - "metadata": {}, - "source": [ - "# Residual quantizer" - ] - }, - { - "cell_type": "markdown", - "id": "9e5910d8", - "metadata": {}, - "source": [ - "This is a 2-level additive quantizer where the first level is trained first, then the second. Since it is an additive quantizer, the top-k centroids can be retrieved efficiently with lookup tables. " - ] - }, - { - "cell_type": "code", - "execution_count": 33, - "id": "elect-vacation", - "metadata": {}, - "outputs": [], - "source": [ - "quantizer = faiss.ResidualCoarseQuantizer(d, 2, int(np.log2(sqrt_nlist)))" - ] - }, - { - "cell_type": "code", - "execution_count": 34, - "id": "nervous-lesbian", - "metadata": {}, - "outputs": [], - "source": [ - "index = faiss.IndexIVFFlat(quantizer, d, nlist)\n", - "index.quantizer_trains_alone = 1" - ] - }, - { - "cell_type": "code", - "execution_count": 35, - "id": "ae530558", - "metadata": {}, - "outputs": [], - "source": [ - "index.train(xt)" - ] - }, - { - "cell_type": "code", - "execution_count": 40, - "id": "ceaa6077", - "metadata": {}, - "outputs": [], - "source": [ - "quantizer.set_beam_factor(-1)" - ] - }, - { - "cell_type": "code", - "execution_count": 41, - "id": "3eb25d40", - "metadata": {}, - "outputs": [ - { - "data": { - "text/plain": [ - "3.604173447168" - ] - }, - "execution_count": 41, - "metadata": {}, - "output_type": "execute_result" - } - ], - "source": [ - "index.add(xb)\n", - "index.invlists.imbalance_factor()" - ] - }, - { - "cell_type": "code", - "execution_count": 42, - "id": "af3a02de", - "metadata": {}, - "outputs": [ - { - "name": "stdout", - "output_type": "stream", - "text": [ - "nprobe=1 1-recall @ 1: 0.3079 dis/q=878.77\n", - "nprobe=4 1-recall @ 1: 0.6091 dis/q=3017.90\n", - "nprobe=16 1-recall @ 1: 0.8608 dis/q=9996.18\n", - "nprobe=64 1-recall @ 1: 0.9685 dis/q=31318.18\n" - ] - } - ], - "source": [ - "stats = faiss.cvar.indexIVF_stats\n", - "\n", - "for nprobe in 1, 4, 
16, 64: \n", - " index.nprobe = nprobe \n", - " stats.reset()\n", - "\n", - " D, I = index.search(xq, 100)\n", - " rank = 1\n", - " recall = (I[:, :rank] == gt[:, :1]).sum() / len(xq)\n", - " print(f\"nprobe={nprobe} 1-recall @ {rank}: {recall} dis/q={stats.ndis/len(xq):.2f}\")" - ] - }, - { - "cell_type": "markdown", - "id": "b9db020c", - "metadata": {}, - "source": [ - "Unfortunately still not very good. " - ] - }, - { - "cell_type": "markdown", - "id": "9a0514ef", - "metadata": {}, - "source": [ - "# 2-level tree quantizer" - ] - }, - { - "cell_type": "markdown", - "id": "adfc3b23", - "metadata": {}, - "source": [ - "This is a suggestion by Harsha: just cluster to 64 centroids at the first level and train separate clusterings within each bucket." - ] - }, - { - "cell_type": "code", - "execution_count": 47, - "id": "4f86ff7a", - "metadata": {}, - "outputs": [], - "source": [ - "# 1st level quantizer " - ] - }, - { - "cell_type": "code", - "execution_count": 48, - "id": "8157ef04", - "metadata": {}, - "outputs": [], - "source": [ - "km = faiss.Kmeans(d, sqrt_nlist)" - ] - }, - { - "cell_type": "code", - "execution_count": 49, - "id": "29b154ce", - "metadata": {}, - "outputs": [ - { - "data": { - "text/plain": [ - "9879.4462890625" - ] - }, - "execution_count": 49, - "metadata": {}, - "output_type": "execute_result" - } - ], - "source": [ - "km.train(xt)" - ] - }, - { - "cell_type": "code", - "execution_count": 50, - "id": "27a355a7", - "metadata": {}, - "outputs": [], - "source": [ - "centroids1 = km.centroids" - ] - }, - { - "cell_type": "code", - "execution_count": 62, - "id": "6083d36f", - "metadata": {}, - "outputs": [], - "source": [ - "xt2 = ds.get_train(500_000)\n", - "\n", - "_, assign1 = km.assign(xt2)\n", - "bc = np.bincount(assign1)\n", - "o = assign1.argsort()" - ] - }, - { - "cell_type": "code", - "execution_count": 64, - "id": "32e64dfb", - "metadata": {}, - "outputs": [ - { - "name": "stdout", - "output_type": "stream", - "text": [ - "63\r" - ] - } 
- ], - "source": [ - "i0 = 0\n", - "c2 = []\n", - "for c1 in range(sqrt_nlist): \n", - " print(c1, end=\"\\r\", flush=True)\n", - " i1 = i0 + bc[c1]\n", - " subset = o[i0:i1]\n", - " assert np.all(assign1[subset] == c1)\n", - " km = faiss.Kmeans(d, sqrt_nlist)\n", - " xtsub = xt2[subset]\n", - " km.train(xtsub)\n", - " c2.append(km.centroids)\n", - " i0 = i1" - ] - }, - { - "cell_type": "markdown", - "id": "704c495a", - "metadata": {}, - "source": [ - "Then we just stack the centroids together and forget about the first level clustering. \n", - "In reality with 262k-1M clusters, we'll train a HNSW or NSG index on top. " - ] - }, - { - "cell_type": "code", - "execution_count": 65, - "id": "b41aeeae", - "metadata": {}, - "outputs": [], - "source": [ - "centroids12 = np.vstack(c2)" - ] - }, - { - "cell_type": "code", - "execution_count": 66, - "id": "7041f966", - "metadata": {}, - "outputs": [], - "source": [ - "quantizer = faiss.IndexFlatL2(d)\n", - "quantizer.add(centroids12)\n", - "index = faiss.IndexIVFFlat(quantizer, d, nlist)" - ] - }, - { - "cell_type": "code", - "execution_count": 68, - "id": "1bf4175d", - "metadata": {}, - "outputs": [ - { - "data": { - "text/plain": [ - "1.200742457344" - ] - }, - "execution_count": 68, - "metadata": {}, - "output_type": "execute_result" - } - ], - "source": [ - "index.add(xb)\n", - "index.invlists.imbalance_factor()" - ] - }, - { - "cell_type": "code", - "execution_count": 69, - "id": "6d2acf15", - "metadata": {}, - "outputs": [ - { - "name": "stdout", - "output_type": "stream", - "text": [ - "nprobe=1 1-recall @ 1: 0.3774 dis/q=291.20\n", - "nprobe=4 1-recall @ 1: 0.6847 dis/q=1153.03\n", - "nprobe=16 1-recall @ 1: 0.8995 dis/q=4459.66\n", - "nprobe=64 1-recall @ 1: 0.9825 dis/q=16942.70\n" - ] - } - ], - "source": [ - "stats = faiss.cvar.indexIVF_stats\n", - "for nprobe in 1, 4, 16, 64: \n", - " index.nprobe = nprobe \n", - " stats.reset()\n", - " D, I = index.search(xq, 100)\n", - " rank = 1\n", - " recall = (I[:, :rank] 
== gt[:, :1]).sum() / len(xq)\n", - " print(f\"nprobe={nprobe} 1-recall @ {rank}: {recall} dis/q={stats.ndis/len(xq):.2f}\")" - ] - }, - { - "cell_type": "markdown", - "id": "35c0a565", - "metadata": {}, - "source": [ - "Turns out this is very good: same level of accuracy as the flat topline!" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "id": "1b4f1c3a", - "metadata": {}, - "outputs": [], - "source": [] - } - ], - "metadata": { - "kernelspec": { - "display_name": "Python 3", - "language": "python", - "name": "python3" - }, - "language_info": { - "codemirror_mode": { - "name": "ipython", - "version": 3 - }, - "file_extension": ".py", - "mimetype": "text/x-python", - "name": "python", - "nbconvert_exporter": "python", - "pygments_lexer": "ipython3", - "version": "3.8.10" - } - }, - "nbformat": 4, - "nbformat_minor": 5 -} diff --git a/plot.py b/plot.py deleted file mode 100644 index 941b78cab..000000000 --- a/plot.py +++ /dev/null @@ -1,160 +0,0 @@ -import os -import matplotlib as mpl -mpl.use('Agg') # noqa -import matplotlib.pyplot as plt -import numpy as np -import argparse - -from benchmark.datasets import DATASETS -from benchmark.algorithms.definitions import get_definitions -from benchmark.plotting.metrics import all_metrics as metrics -from benchmark.plotting.utils import (get_plot_label, compute_metrics, - create_linestyles, create_pointset) -from benchmark.results import (store_results, load_all_results, - get_unique_algorithms) - - -def create_plot(all_data, raw, x_scale, y_scale, xn, yn, fn_out, linestyles): - xm, ym = (metrics[xn], metrics[yn]) - # Now generate each plot - handles = [] - labels = [] - plt.figure(figsize=(12, 9)) - - # Sorting by mean y-value helps aligning plots with labels - def mean_y(algo): - xs, ys, ls, axs, ays, als = create_pointset(all_data[algo], xn, yn) - return -np.log(np.array(ys)).mean() - # Find range for logit x-scale - min_x, max_x = 1, 0 - for algo in sorted(all_data.keys(), key=mean_y): - xs, ys, ls, 
axs, ays, als = create_pointset(all_data[algo], xn, yn) - min_x = min([min_x]+[x for x in xs if x > 0]) - max_x = max([max_x]+[x for x in xs if x < 1]) - color, faded, linestyle, marker = linestyles[algo] - handle, = plt.plot(xs, ys, '-', label=algo, color=color, - ms=7, mew=3, lw=3, linestyle=linestyle, - marker=marker) - handles.append(handle) - if raw: - handle2, = plt.plot(axs, ays, '-', label=algo, color=faded, - ms=5, mew=2, lw=2, linestyle=linestyle, - marker=marker) - labels.append(algo) - - ax = plt.gca() - ax.set_ylabel(ym['description']) - ax.set_xlabel(xm['description']) - # Custom scales of the type --x-scale a3 - if x_scale[0] == 'a': - alpha = int(x_scale[1:]) - fun = lambda x: 1-(1-x)**(1/alpha) - inv_fun = lambda x: 1-(1-x)**alpha - ax.set_xscale('function', functions=(fun, inv_fun)) - if alpha <= 3: - ticks = [inv_fun(x) for x in np.arange(0,1.2,.2)] - plt.xticks(ticks) - if alpha > 3: - from matplotlib import ticker - ax.xaxis.set_major_formatter(ticker.LogitFormatter()) - #plt.xticks(ticker.LogitLocator().tick_values(min_x, max_x)) - plt.xticks([0, 1/2, 1-1e-1, 1-1e-2, 1-1e-3, 1-1e-4, 1]) - # Other x-scales - else: - ax.set_xscale(x_scale) - ax.set_yscale(y_scale) - ax.set_title(get_plot_label(xm, ym)) - box = plt.gca().get_position() - # plt.gca().set_position([box.x0, box.y0, box.width * 0.8, box.height]) - ax.legend(handles, labels, loc='center left', - bbox_to_anchor=(1, 0.5), prop={'size': 9}) - plt.grid(b=True, which='major', color='0.65', linestyle='-') - plt.setp(ax.get_xminorticklabels(), visible=True) - - # Logit scale has to be a subset of (0,1) - if 'lim' in xm and x_scale != 'logit': - x0, x1 = xm['lim'] - plt.xlim(max(x0,0), min(x1,1)) - elif x_scale == 'logit': - plt.xlim(min_x, max_x) - if 'lim' in ym: - plt.ylim(ym['lim']) - - # Workaround for bug https://github.com/matplotlib/matplotlib/issues/6789 - ax.spines['bottom']._adjust_location() - - plt.savefig(fn_out, bbox_inches='tight') - plt.close() - - -if __name__ == "__main__": 
- parser = argparse.ArgumentParser() - parser.add_argument( - '--dataset', - metavar="DATASET", - default='sift-1M') - parser.add_argument( - '--count', - default=-1, - type=int) - parser.add_argument( - '--definitions', - metavar='FILE', - help='load algorithm definitions from FILE', - default='algos.yaml') - parser.add_argument( - '--limit', - default=-1) - parser.add_argument( - '-o', '--output') - parser.add_argument( - '-x', '--x-axis', - help='Which metric to use on the X-axis', - choices=metrics.keys(), - default="k-nn") - parser.add_argument( - '-y', '--y-axis', - help='Which metric to use on the Y-axis', - choices=metrics.keys(), - default="qps") - parser.add_argument( - '-X', '--x-scale', - help='Scale to use when drawing the X-axis. Typically linear, logit or a2', - default='linear') - parser.add_argument( - '-Y', '--y-scale', - help='Scale to use when drawing the Y-axis', - choices=["linear", "log", "symlog", "logit"], - default='linear') - parser.add_argument( - '--raw', - help='Show raw results (not just Pareto frontier) in faded colours', - action='store_true') - parser.add_argument( - '--recompute', - help='Clears the cache and recomputes the metrics', - action='store_true') - args = parser.parse_args() - - if not args.output: - args.output = 'results/%s.png' % (args.dataset) - print('writing output to %s' % args.output) - - dataset = DATASETS[args.dataset]() - - if args.count == -1: - args.count = dataset.default_count() - if args.x_axis == "k-nn" and dataset.search_type() == "range": - args.x_axis = "ap" - count = int(args.count) - unique_algorithms = get_unique_algorithms() - results = load_all_results(args.dataset, count) - linestyles = create_linestyles(sorted(unique_algorithms)) - runs = compute_metrics(dataset.get_groundtruth(k=args.count), - results, args.x_axis, args.y_axis, args.recompute) - if not runs: - raise Exception('Nothing to plot') - - create_plot(runs, args.raw, args.x_scale, - args.y_scale, args.x_axis, args.y_axis, args.output, 
- linestyles) diff --git a/requirements.txt b/requirements.txt deleted file mode 100644 index 62ffd69d7..000000000 --- a/requirements.txt +++ /dev/null @@ -1,11 +0,0 @@ -ansicolors==1.1.8 -docker==2.6.1 -h5py==2.10.0 -matplotlib==2.1.0 -numpy==1.16.0 -pyyaml==5.4 -psutil==5.6.6 -scipy==1.0.0 -scikit-learn==0.19.1 -jinja2==2.11.3 -pandas diff --git a/requirements_py38.txt b/requirements_py38.txt deleted file mode 100644 index 503d4cf7f..000000000 --- a/requirements_py38.txt +++ /dev/null @@ -1,11 +0,0 @@ -ansicolors==1.1.8 -docker==2.6.1 -h5py==2.10.0 -matplotlib==3.3.4 -numpy==1.19.5 -pyyaml==5.4 -psutil==5.8.0 -scipy==1.5.4 -scikit-learn -jinja2==2.11.3 -pandas==1.1.5 diff --git a/run.py b/run.py deleted file mode 100644 index 043943b25..000000000 --- a/run.py +++ /dev/null @@ -1,6 +0,0 @@ -from benchmark.main import main -from multiprocessing import freeze_support - -if __name__ == "__main__": - freeze_support() - main() diff --git a/run_algorithm.py b/run_algorithm.py deleted file mode 100644 index cdf383ddd..000000000 --- a/run_algorithm.py +++ /dev/null @@ -1,3 +0,0 @@ -from benchmark.runner import run_from_cmdline - -run_from_cmdline() diff --git a/style.css b/style.css new file mode 100644 index 000000000..b4243362a --- /dev/null +++ b/style.css @@ -0,0 +1,572 @@ +:root { + --color-navy: #01004b; + --color-blue: #1c17ff; + --color-light-gray: #f1f5f8; + --color-gray: #525252; + + --spacing-sm: 1.5625rem; /* 25px */ + --spacing-md: 3.125rem; /* 50px */ + --spacing-lg: 4.6875rem; /* 75px */ +} + +@font-face { + font-family: "MediumLLWeb"; + src: url("/fonts/MediumLLWeb-Regular.woff2") format("woff2"); + font-weight: 400; + font-style: normal; + font-display: swap; +} + +@font-face { + font-family: "MediumLLWeb"; + src: url("/fonts/MediumLLWeb-SemiBold.woff2") format("woff2"); + font-weight: 600; + font-style: normal; + font-display: swap; +} + +*, +*:before, +*:after { + box-sizing: border-box; + margin: 0; + padding: 0; +} + +html { + scroll-behavior: smooth; 
+} + +body { + font-family: "MediumLLWeb", sans-serif; +} + +h1 { + font-size: 2.75rem; + line-height: 3.3rem; +} + +h2 { + font-size: 1.875rem; + line-height: 2.25rem; +} + +h3 { + font-size: 1.25rem; + line-height: 1.75rem; +} + +h4 { + font-size: 1.125rem; + line-height: 1.5rem; +} + +/* Text */ +p, +li { + font-size: 1rem; + line-height: 1.375rem; +} + +a { + text-decoration: none; + color: var(--color-blue); + transition: color 0.3s ease-in-out; +} + +a:hover { + color: var(--color-navy); +} + +.container { + width: 100%; + max-width: 77rem; + margin: 0 auto; + padding-left: 1.5rem; + padding-right: 1.5rem; +} + +/* Header/footer */ +.header { + background-color: #fff; + position: sticky; + top: 0; +} + +.footer { + background-color: var(--color-navy); +} + +.header a, +.footer a { + text-decoration: none; + font-size: 1rem; +} + +.header a { + color: #000; +} + +.footer a { + color: #fff; +} + +.header > .container, +.footer > .container { + display: flex; + justify-content: space-between; + align-items: center; + padding-top: var(--spacing-sm); + padding-bottom: var(--spacing-sm); + gap: var(--spacing-sm); + /* max-width: 56rem; */ +} + +.footer > .container { + flex-direction: column; + align-items: center; +} + +/* Header/footer Title */ +.header .title, +.footer .title { + text-decoration: none; + font-weight: 600; + white-space: nowrap; +} + +/* Nav */ +.header nav, +.header .external-links { + display: none; +} + +.header nav > ul, +.footer nav > ul { + display: flex; + flex-wrap: wrap; + list-style: none; + justify-content: center; + row-gap: 1rem; + column-gap: 1.875rem; +} + +/* External / logo links */ +.external-links { + display: flex; + gap: 1.875rem; +} + +.external-links img { + width: 1.875rem; + height: 1.875rem; + object-fit: contain; +} + +.content-section { + padding-top: var(--spacing-md); + padding-bottom: var(--spacing-md); +} + +/* Hero */ +.hero { + background-color: var(--color-light-gray); +} + +.hero > .container { + text-align: 
center; + display: flex; + flex-direction: column; + gap: var(--spacing-md); +} + +.hero-eyebrow { + font-weight: 600; + color: var(--color-navy); +} + +.hero h1 { + margin-top: var(--spacing-sm); + color: var(--color-navy); +} + +.hero h1 > span { + display: block; + color: var(--color-blue); +} + +.hero .buttons { + display: flex; + flex-wrap: wrap; + justify-content: center; + gap: 1.25rem; +} + +.button { + width: 100%; + padding: 0.75rem 1.875rem; + font-size: 1.125rem; + font-weight: 600; + text-decoration: none; + background-color: var(--color-blue); + border: 2px solid var(--color-blue); + border-radius: 5px; + color: #fff; + transition: all 0.3s ease-in-out; + text-align: center; +} + +.button.button-white { + background-color: #fff; + color: var(--color-blue); + border: 2px solid var(--color-blue); +} + +.button.button-alpha:hover { + color: #fff; + background-color: #030080; + border-color: #030080; +} + +.button.button-white:hover { + background-color: var(--color-light-gray); +} + +.presented-by { + font-size: 1.25rem; + line-height: 1.75rem; + text-align: center; + display: flex; + flex-wrap: wrap; + justify-content: center; + align-items: baseline; + gap: 0.9375rem; +} + +.presented-by .microsoft-logo, +.presented-by .pinecone-logo { + width: 7rem; + height: auto; +} + +.presented-by .aws-logo { + width: 2.5rem; + height: auto; +} + +.presented-by .zilliz-logo { + width: 6rem; + height: auto; +} + +.hero .hero-text { + color: var(--color-gray); +} + +/* Results section */ +.results { + background-color: #fff; +} + +.results .buttons { + display: flex; + flex-wrap: wrap; + justify-content: center; + gap: 1.25rem; + margin-top: var(--spacing-md); +} + +.results .title { + text-align: center; + color: var(--color-navy); +} + +.results h3 { + margin-top: var(--spacing-sm); + text-align: center; +} + +.results h4 { + margin-top: var(--spacing-md); +} + +.result-list { + display: flex; + flex-direction: column; + gap: 1rem; + margin: var(--spacing-sm) 0 
var(--spacing-sm); + list-style: disc outside; + padding-left: 1.4rem; + color: var(--color-gray); +} + +.result-list li > span:not(.authors), +.result-list li::marker { + color: #000; + font-weight: 600; +} + +.result-list li > span.authors { + display: block; + margin-top: 0.5rem; + font-size: 1rem; +} + +.result-list li > span.authors > span { + color: #000; + font-weight: 600; +} + +/* Tracks section */ +.tracks { + background-color: var(--color-light-gray); +} + +.tracks .title { + text-align: center; +} + +.tracks .title > h2 { + color: var(--color-navy); + margin-bottom: var(--spacing-sm); +} + +.tracks .title > p { + color: var(--color-gray); +} + +.tracks-list { + display: flex; + flex-direction: column; + gap: 1.75rem; + margin: var(--spacing-md) 0; + list-style: disc outside; + padding-left: 1.4rem; + color: var(--color-gray); +} + +.tracks-list li > span, +.tracks-list li::marker { + color: #000; + font-weight: 600; +} + +.table-notes { + display: block; + text-align: center; + margin-top: var(--spacing-sm); + font-size: 1rem; +} + +.table-notes > a { + text-decoration: none; + color: var(--color-blue); +} + +/* Table */ +.table-container { + text-align: center; + overflow-x: auto; +} + +.group-border { + border-right: 3px solid #738fab; +} + +table { + border-collapse: collapse; + font-size: 1rem; + margin: 0 auto; +} + +th, +td { + border: 2px solid #738fab; + padding: 0.75rem; +} + +th { + background-color: #25239d; + color: #fff; +} + +/* Participation */ +.participate { + background-color: #fff; +} + +.participate h2 { + text-align: center; + color: var(--color-navy); +} + +.participate-section { + margin-top: var(--spacing-md); +} + +.participate-section > ul { + padding-left: 1.4rem; + margin-top: var(--spacing-sm); + display: flex; + flex-direction: column; + gap: var(--spacing-sm); +} + +.participate-section > ul > li span { + font-weight: 600; +} + +/* Contributor section */ + +.organizers { + background-color: var(--color-light-gray); +} + 
+.organizers > .container { + display: flex; + flex-direction: column; + align-items: center; + gap: var(--spacing-md); +} + +.organizers .title { + text-align: center; +} + +.organizers .title > h2 { + color: var(--color-navy); +} + +.organizers .title > p { + color: var(--color-gray); + margin: var(--spacing-sm) auto 0; + max-width: 54rem; +} + +.organizer-grid { + display: flex; + flex-wrap: wrap; + justify-content: center; + row-gap: var(--spacing-sm); + column-gap: var(--spacing-md); + max-width: 59.375rem; +} + +.organizer { + width: 10.2rem; +} + +.organizer > img { + width: 9.8125rem; + height: 9.8125rem; + object-fit: cover; + border-radius: 5px; +} + +.organizer .name { + display: block; + font-size: 1.25rem; + font-weight: 600; + color: #0a2540; +} + +.organizer .role { + display: block; + font-size: 1rem; + color: var(--color-gray); +} + +.organizer .image-border { + border: 1px solid var(--color-navy); +} + +.organizers .presented-by { + color: var(--color-navy); +} + +@media only screen and (min-width: 768px) { + .container { + padding: 0 2.5rem; + } + + .content-section { + padding-top: var(--spacing-lg); + padding-bottom: var(--spacing-lg); + } + + p, + li { + font-size: 1.25rem; + line-height: 1.75rem; + } + + h1 { + font-size: 3.75rem; + line-height: 4.125rem; + } + + h2 { + font-size: 2.75rem; + line-height: 3.3rem; + } + + h3 { + font-size: 1.875rem; + line-height: 2.25rem; + } + + h4 { + font-size: 1.5rem; + } + + .button { + width: auto; + } + + .header nav { + display: block; + } + + .tracks-list { + margin: var(--spacing-lg) 0; + } + + .participate-section { + margin-top: var(--spacing-lg); + } + + .organizers > .container { + gap: var(--spacing-lg); + } + + .organizer-grid { + row-gap: var(--spacing-md); + column-gap: var(--spacing-lg); + } + + .presented-by { + font-size: 1.875rem; + line-height: 2.25rem; + } + + .presented-by .microsoft-logo, + .presented-by .pinecone-logo { + width: 10rem; + height: auto; + } + + .presented-by .aws-logo 
{ + width: 3.5rem; + height: auto; + } +} + +@media only screen and (min-width: 1024px) { + .header .external-links { + display: flex; + } + + .footer > .container { + flex-direction: row; + } +} diff --git a/t1_t2/README.md b/t1_t2/README.md deleted file mode 100644 index 22cec24be..000000000 --- a/t1_t2/README.md +++ /dev/null @@ -1,296 +0,0 @@ -# T1 and T2 Tracks - -## Table Of Contents - -- [Introduction](#introduction) -- [For Participants](#for_participants) - - [Getting Started](#getting_started) - - [Starting Your Development](#starting_your_development) - - [Developing Your Dockerfile](#developing_your_dockerfile) - - [Developing Your Algorithm](#developing_your_algorithm) - - [Measuring your Algorithm](#measuring_your_algorithm) - - [How To Get Help](#how_to_get_help) - - [Leaderboard](#leaderboard) -- [For Evaluators](#for_organizers) - -## Introduction - -The T1 and T2 tracks evaluate algorithms on standardized Azure CPU servers. - -**Track 1**: In-memory indices with [FAISS](https://github.com/facebookresearch/faiss) as the baseline. Search would use Azure [Standard_F32s_v2 VMs](https://docs.microsoft.com/en-us/azure/virtual-machines/fsv2-series) with 32 vCPUs and 64GB RAM. - -**Track 2:** Out-of-core indices with [DiskANN](https://github.com/Microsoft/diskann) as the baseline. In addition to the limited DRAM in T1, index can use an SSD for search. Search would use Azure [Standard_L8s_v2 VMs](https://docs.microsoft.com/en-us/azure/virtual-machines/lsv2-series) with 8 vCPUS, 64GB RAM and a local SSD Index constrained to 1TB. - -Index construction for both tracks would use Azure [Standard_F64s_v2 VM](https://docs.microsoft.com/en-us/azure/virtual-machines/fsv2-series) with 64vCPUs, 128GB RAM and an additional [4TB of Premium SSD](https://docs.microsoft.com/en-us/azure/virtual-machines/disks-types) to be used for storing the data, index and other intermediate data. There is a **time limit for 4 days per dataset** for index build. 
- -Queries will be supplied in one shot and the algorithm can execute the queries in any order. - -We will release plots for recall vs QPS separately for tracks T1 and T2. -Additionally, we will release leaderboards for T1 and T2. The metric for the leaderboard in each track will be the sum of improvements in recall over the baseline at the target QPS over all datasets. **The target recall -for T1 is 10000 QPS and for T2 is 1500 QPS.** - -Participants must submit their algorithm via a pull request and (optionally) index file(s) upload (one per participating dataset). - - -## For_Participants - -### Requirements - -You will need the following installed on your machine: -* Python ( we tested with Anaconda using an environment created for Python version 3.8 ) and Docker. -* Note that we tested everything on Ubuntu Linux 18.04 but other environments should be possible. - -### Getting_Started - -This section will present a small tutorial about how to use this framework and several of the key scripts you will use throughout the development of your algorithm and eventual submission. - -First, clone this repository and cd into the project directory: -``` -git clone -cd -``` -Install the python package requirements: -``` -pip install -r requirements_py38.txt -``` -Create a small, sample dataset. For example, to create a dataset with 10000 20-dimensional random floating point vectors, run: -``` -python create_dataset.py --dataset random-xs -``` -To create a smaller slice of the competition datasets (e.g. 10M slice of deep-1B), run: -``` -python create_dataset.py --dataset deep-10M -``` -To see a complete list of datasets, run the following: -``` -python create_dataset.py --help -``` - -For T2, set up the local SSD on Azure Ls8v2 machine by running the following under sudo. 
-``` -parted /dev/nvme0n1 mklabel gpt mkpart primary 0% 100%; -mkfs -t ext4 /dev/nvme0n1; -mkdir /nvme; -mount /dev/nvme0n1 /nvme/; -echo "/dev/nvme0n1 /nvme ext4 defaults 0 0" >> /etc/fstab; -``` -You might also want to create a symbolic link to a folder under `/nvme` -``` -sudo mkdir /nvme/data -sudo chmod 777 /nvme/data -ln -s /nvme/data data -``` - -Build the docker container for the T1 or T2 baselines: -``` -#for T1 -python install.py --algorithm faissconda -#for T2 -python install.py --algorithm diskann -``` -Run a benchmark evaluation using the algorithm's definition file: -``` -python run.py --algorithm faiss_t1 --dataset random-xs -python run.py --algorithm diskann-t2 --dataset random-xs -``` - -For the competition dataset (e.g. deep-1B), running the following command downloads a prebuilt index and runs the queries locally. -``` -python run.py --algorithm faiss_t1 --dataset deep-1B -python run.py --algorithm diskann-t2 --dataset deep-1B -``` - -Now plot QPS vs recall: -``` -python plot.py --algorithm faiss_t1 --dataset random-xs -python plot.py --algorithm diskann-t2 --dataset random-xs -``` -This will place a plot into the *results/* directory. - -### Starting_Your_Development - -First, please create a short name for your team without spaces or special characters. Henceforth in these instructions, this will be referenced as [your_team_name]. - -Create a custom branch off main in this repository: -``` -# For t1 -git checkout -b t1/[your_team_name] -# For t2 -git checkout -b t2/[your_team_name] -``` - - -### Developing_Your_Dockerfile - -This framework evaluates algorithms in Docker containers by default. Your algorithm's Dockerfile should live in *install/Docker.[your_team_name]*. Your Docker file should contain everything needed to install and run your algorithm on a system with the same hardware. - -Please consult the Dockerfiles [here](../install/Dockerfile.faissconda) and [here](../install/Dockerfile.diskann) for examples. 
- -To build your Docker container, run: -``` -python install.py --install [your_team_name] -``` - -### Developing_Your_Algorithm - -Develop and add your algorithm's python class to the [benchmark/algorithms](../benchmark/algorithms) directory. -* You will need to subclass from the [BaseANN class](../benchmark/algorithms/base.py) and implement the functions of that parent class. -* You should consult the examples already in the directory. -* If it is difficult to write a Python wrapper, please consult [HttpANN](../benchmark/algorithms/httpann_example.py) for a RESTful API. - - -When you are ready to test on the competition datasets, use the create_dataset.py script as follows: -``` -python create_dataset.py --dataset [sift-1B|bigann-1B|text2image-1B|msturing-1B|msspacev-1B|ssnpp-1B] -``` -To benchmark your algorithm, first create an algorithm configuration yaml in your teams directory called *algos.yaml.* This file contains the index build parameters and query parameters that will get passed to your algorithm at run-time. Please look at [algos.yaml](../algos.yaml). - -If your machine is capable of both building and searching an index, you can benchmark your algorithm using the run.py script. -``` -python run.py --algorithm diskann-t2 --dataset deep-1B -``` -This will write the results to the toplevel [results](../results) directory. - -To build the index and upload it to Azure cloud storage without querying it: -``` -python run.py --algorithm diskann-t2 --dataset deep-1B --upload-index --blob-prefix --sas-string -``` -To download the index from cloud storage and query it on another machine: -``` -python run.py --algorithm diskann-t2 --dataset deep-1B --download-index --blob-prefix --sas-string -``` - -### Measuring_Your_Algorithm - - -Now you can analyze the results using plot.py. Sudo might be required here. To avoid sudo, run `sudo chmod -R 777 results/` before invoking these scripts. 
-``` -python plot.py --algorithm [your_team_name] --dataset deep-1B -``` -This will place a plot of the algorithms performance into the toplevel [results](../results) directory. - -The plot.py script supports other benchmarks. To see a complete list, run: -``` -python plot.py --help -``` - -You can plot additional metrics, e.g. mean SSD IOs vs recall/AP for T2, using: -``` -python plot.py --dataset deep-1B -x k-nn -y mean_ssd_ios -``` - - -Here are all the FAISS baseline recall@10 (AP for SSNPP) vs throughput plots for T1: -* [msturing-1B](results/T1/msturing-1B.png) -* [bigann-1B](results/T1/bigann-1B.png) -* [text2image-1B](results/T1/text2image-1B.png) -* [deep-1B](results/T1/deep-1B.png) -* [msspacev-1B](results/T1/msspacev-1B.png) -* [ssnpp-1B](results/T1/ssnpp-1B.png) - -Here are all the DiskANN baseline recall@10 (AP for SSNPP) vs throughput plots for T2: -* [msturing-1B](results/T2/msturing-1B.png) -* [bigann-1B](results/T2/bigann-1B.png) -* [text2image-1B](results/T2/text2image-1B.png) -* [deep-1B](results/T2/deep-1B.png) -* [msspacev-1B](results/T2/msspacev-1B.png) -* [ssnpp-1B](results/T2/ssnpp-1B.png) - - -Here are all the DiskANN baseline recall@10 (AP for SSNPP) vs mean SSD IOs plots for T2: -* [msturing-1B](results/T2/msturing-1B-IO.png) -* [bigann-1B](results/T2/bigann-1B-IO.png) -* [text2image-1B](results/T2/text2image-1B-IO.png) -* [deep-1B](results/T2/deep-1B-IO.png) -* [msspacev-1B](results/T2/msspacev-1B-IO.png) -* [ssnpp-1B](results/T2/ssnpp-1B-IO.png) - -To get a table overview over the best recall/ap achieved over a certain QPS threshold, run -``` -python3 data_export.py --output res.csv -python3 eval/show_operating_points.py --algorithm $ALGO --threshold $THRESHOLD res.csv -``` - -For the track1 baseline, the output, this led to - -``` - recall/ap -algorithm dataset -faiss-t1 bigann-1B 0.634510 - deep-1B 0.650280 - msspacev-1B 0.728861 - msturing-1B 0.703611 - ssnpp-1B 0.753780 - text2image-1B 0.069275 -``` - -For the track2 baseline, this 
led to - -``` - recall/ap -algorithm dataset -diskann-t2 bigann-1B 0.94913 - deep-1B 0.93706 - msspacev-1B 0.90095 - msturing-1B 0.93564 - ssnpp-1B 0.16274 - text2image-1B 0.48854 -``` - -### Submitting_Your_Algorithm - -A submission is composed of a pull request to this repo with the following. -* Your algorithm's python class, inheriting from `BaseANN`, placed in the [benchmark/algorithms/](../benchmark/algorithms) directory. -* A Dockerfile in `install/` describing how to retrieve, compile and set up requirements for your algorithm. -* For each dataset you are participating in, add to [algos.yaml](../algos.yaml) - * 1 index build configuration - * 10 search configuration -* Add an entry to [CI test list](../.github/workflows/benchmarks.yml) for the random-xs dataset, and for the random-range-xs dataset if your algorithm supports range search. We can start working with larger datasets once these tests pass. -* An URL to download any prebuilt indices placed in `algos.yaml`. **This is optional, but strongly encourages.** This would help us evaluate faster, although we would build your index to verify the time limit. Please see `faiss_t1.py` and `diskann-t2.py` for examples. If you are unable to host the index on your own Azure blob storage, please let us know and we can arrange to have it copied to organizer's account. - -We will run early PRs on organizer's machines to the extent possible and provide any feedback necessary. - -### How_To_Get_Help - -There are several ways to get help as you develop your algorithm using this framework: -* You can submit an issue at this github repository. -* Send an email to the competition's T1/T2 organizer, harsha.v.simhadri@gmail.com -* Send en email to the competition's googlegroup, big-ann-organizers@googlegroups.com - -### Leaderboard - -This leaderboard is based on the standard recall@10 vs throughput benchmark that has become a standard benchmark when evaluating and comparing approximate nearest neighbor algorithms. 
We have run FAISS and DiskANN as baselines for T1 and T2 respectively, and for each dataset chosen the best recall amongst configurations providing at least **10K QPS for T1 and 1500 QPS for T2**. The recall of the baselines at this QPS threshold is listed [above](#measuring_your_algorithm). - -Algorithms will be ranked on how much their recall surpasses the baselines at these QPS thresholds. We will add up the recall improvements of each algorithm on all data sets it competes on. Participants are required to commit to at least 3 datasets, and ideally more. Algorithms that work on more datasets are at an advantage as they can benefit from additional scores. Any recall regression compared to the baseline on the datasets committed to will be subtracted from the final score. - -#### Results for T1 -The table lists best Recall/AP obtained at at least 10,000 QPS by algorithms in pull requests submitted before Nov 2021. All non-empty cells are derived from author-published indices that succesfully ran on the standardized hardware with author-provided query configurations. Recall for bigann-1B does not count ties. This result is on the public query set. 
- - -| PR | Name |bigann-1B | deep-1B | msspacev-1B | msturing-1B | ssnpp-1B | text2image-1B | -|----|-----------|-----------|---------|-------------|-------------|-----------|-----------------| -| 58 | team11 | | 0.64955 | | 0.712211 | | | -| 60 | puck-t1 |0.71468 | 0.72255 | | | | | -| 66 | ngt-t1 | | | | | | | -| 69 | kst_ann_t1| .71219 | 0.71219 | 0.764542 | 0.756419 | | | -| 71 | buddy-t1 | 0.62765 | | | | | | -|-----|-----------|-----------|---------|-------------|-------------|-----------|----------------| -| | baseline | 0.63451 | 0.65028 | 0.728861 | 0.703611 | 0.75378 | 0.069275 | -|-----|-----------|-----------|---------|-------------|-------------|-----------|----------------| - - -#### Results for T2 -The table lists best Recall/AP obtained at at least 1,500 QPS by algorithms in pull requests submitted before Nov 2021. All non-empty cells are derived from author-published indices that succesfully ran on the standardized hardware with author-provided query configurations. Recall for bigann-1B does not count ties. This result is on the public query set. 
- - -| PR | Name |bigann-1B | deep-1B | msspacev-1B | msturing-1B | ssnpp-1B | text2image-1B | -|----|-----------|-----------|---------|-------------|-------------|-----------|----------------| -| 62 | kota-t2 | 0.950859 | | 0.904001 | 0.939817 | 0.18212 | | -| 66 | ngt-t2 | | | | | | | -| 70 | bbann | | | 0.7602 | | 0.88573 | 0.495423 | -|----|-----------|-----------|---------|-------------|-------------|-----------|----------------| -| | baseline | 0.94913 | 0.93706 | 0.90095 | 0.93564 | 0.16274 | 0.48854 | -|----|-----------|-----------|---------|-------------|-------------|-----------|----------------| - -## For_Evaluators - diff --git a/t1_t2/results/T1/bigann-1B.png b/t1_t2/results/T1/bigann-1B.png deleted file mode 100644 index 82df3c71d..000000000 Binary files a/t1_t2/results/T1/bigann-1B.png and /dev/null differ diff --git a/t1_t2/results/T1/deep-1B.png b/t1_t2/results/T1/deep-1B.png deleted file mode 100644 index b90291c0f..000000000 Binary files a/t1_t2/results/T1/deep-1B.png and /dev/null differ diff --git a/t1_t2/results/T1/msspacev-1B.png b/t1_t2/results/T1/msspacev-1B.png deleted file mode 100644 index 3432fd1d3..000000000 Binary files a/t1_t2/results/T1/msspacev-1B.png and /dev/null differ diff --git a/t1_t2/results/T1/msturing-1B.png b/t1_t2/results/T1/msturing-1B.png deleted file mode 100644 index 357d90f19..000000000 Binary files a/t1_t2/results/T1/msturing-1B.png and /dev/null differ diff --git a/t1_t2/results/T1/ssnpp-1B.png b/t1_t2/results/T1/ssnpp-1B.png deleted file mode 100644 index f2b7b4cdc..000000000 Binary files a/t1_t2/results/T1/ssnpp-1B.png and /dev/null differ diff --git a/t1_t2/results/T1/text2image-1B.png b/t1_t2/results/T1/text2image-1B.png deleted file mode 100644 index 6cf0598a5..000000000 Binary files a/t1_t2/results/T1/text2image-1B.png and /dev/null differ diff --git a/t1_t2/results/T2/bigann-1B-IO.png b/t1_t2/results/T2/bigann-1B-IO.png deleted file mode 100644 index 9e0b6aa9e..000000000 Binary files 
a/t1_t2/results/T2/bigann-1B-IO.png and /dev/null differ diff --git a/t1_t2/results/T2/bigann-1B.png b/t1_t2/results/T2/bigann-1B.png deleted file mode 100644 index fe44fd88a..000000000 Binary files a/t1_t2/results/T2/bigann-1B.png and /dev/null differ diff --git a/t1_t2/results/T2/deep-1B-IO.png b/t1_t2/results/T2/deep-1B-IO.png deleted file mode 100644 index a636ca6af..000000000 Binary files a/t1_t2/results/T2/deep-1B-IO.png and /dev/null differ diff --git a/t1_t2/results/T2/deep-1B.png b/t1_t2/results/T2/deep-1B.png deleted file mode 100644 index 2fe899b4d..000000000 Binary files a/t1_t2/results/T2/deep-1B.png and /dev/null differ diff --git a/t1_t2/results/T2/msspacev-1B-IO.png b/t1_t2/results/T2/msspacev-1B-IO.png deleted file mode 100644 index 0130c437e..000000000 Binary files a/t1_t2/results/T2/msspacev-1B-IO.png and /dev/null differ diff --git a/t1_t2/results/T2/msspacev-1B.png b/t1_t2/results/T2/msspacev-1B.png deleted file mode 100644 index 5253f0cd8..000000000 Binary files a/t1_t2/results/T2/msspacev-1B.png and /dev/null differ diff --git a/t1_t2/results/T2/msturing-1B-IO.png b/t1_t2/results/T2/msturing-1B-IO.png deleted file mode 100755 index 08541aefa..000000000 Binary files a/t1_t2/results/T2/msturing-1B-IO.png and /dev/null differ diff --git a/t1_t2/results/T2/msturing-1B.png b/t1_t2/results/T2/msturing-1B.png deleted file mode 100644 index 351ae5604..000000000 Binary files a/t1_t2/results/T2/msturing-1B.png and /dev/null differ diff --git a/t1_t2/results/T2/res.csv b/t1_t2/results/T2/res.csv deleted file mode 100644 index e032ae062..000000000 --- a/t1_t2/results/T2/res.csv +++ /dev/null @@ -1,60 +0,0 @@ -algorithm,parameters,dataset,count,qps,distcomps,build,indexsize,queriessize,wspq,recall/ap -diskann-t2,DiskANN,bigann-1B,10,1692.271479416587,0.0,1000000.0,60384120.0,35682.28900295449,inf,0.9426500000000001 -diskann-t2,DiskANN,bigann-1B,10,1979.5720516956515,0.0,1000000.0,60384120.0,30503.623219107627,inf,0.9246700000000001 
-diskann-t2,DiskANN,bigann-1B,10,1498.447251013022,0.0,1000000.0,60384120.0,40297.79490681267,inf,0.9549200000000001 -diskann-t2,DiskANN,bigann-1B,10,1395.0126358562839,0.0,1000000.0,60384120.0,43285.71544653797,inf,0.9599399999999999 -diskann-t2,DiskANN,bigann-1B,10,1449.7409112948683,0.0,1000000.0,60384120.0,41651.66308652115,inf,0.95691 -diskann-t2,DiskANN,bigann-1B,10,1173.2852848995394,0.0,1000000.0,60384120.0,51465.84618179226,inf,0.9699899999999999 -diskann-t2,DiskANN,bigann-1B,10,1310.0846908052526,0.0,1000000.0,60384120.0,46091.76828322792,inf,0.96411 -diskann-t2,DiskANN,bigann-1B,10,1594.14800808084,0.0,1000000.0,60384120.0,37878.615846150395,inf,0.94913 -diskann-t2,DiskANN,bigann-1B,10,981.8258342866466,0.0,1000000.0,60384120.0,61501.86508778572,inf,0.97882 -diskann-t2,DiskANN,bigann-1B,10,2303.0911898705594,0.0,1000000.0,60384120.0,26218.727363285067,inf,0.89605 -diskann-t2,DiskANN,deep-1B,10,1660.8887581780666,0.0,1000000.0,60630840.0,36505.05772976017,inf,0.9279400000000001 -diskann-t2,DiskANN,deep-1B,10,1990.253305673633,0.0,1000000.0,60630840.0,30463.88106838417,inf,0.90432 -diskann-t2,DiskANN,deep-1B,10,2307.308080428008,0.0,1000000.0,60630840.0,26277.73920366669,inf,0.8766400000000001 -diskann-t2,DiskANN,deep-1B,10,1021.5658500041819,0.0,1000000.0,60630840.0,59350.88765912819,inf,0.96555 -diskann-t2,DiskANN,deep-1B,10,1525.294026026525,0.0,1000000.0,60630840.0,39750.26386089421,inf,0.93706 -diskann-t2,DiskANN,deep-1B,10,1551.8613031064206,0.0,1000000.0,60630840.0,39069.75441596031,inf,0.93448 -diskann-t2,DiskANN,deep-1B,10,1725.2463398347454,0.0,1000000.0,60630840.0,35143.29438067818,inf,0.92354 -diskann-t2,DiskANN,deep-1B,10,1349.5413709825298,0.0,1000000.0,60630840.0,44926.99616600704,inf,0.9466699999999999 -diskann-t2,DiskANN,deep-1B,10,1220.8964718445557,0.0,1000000.0,60630840.0,49660.91834829998,inf,0.9545299999999999 -diskann-t2,DiskANN,deep-1B,10,1600.3843696590948,0.0,1000000.0,60630840.0,37885.17380541229,inf,0.9320600000000001 
-diskann-t2,DiskANN,msspacev-1B,10,883.7119232408137,0.0,1000000.0,57424484.0,64980.999452184245,inf,0.914753035884841 -diskann-t2,DiskANN,msspacev-1B,10,824.5735527738586,0.0,1000000.0,57424484.0,69641.43320729183,inf,0.9160526674853322 -diskann-t2,DiskANN,msspacev-1B,10,950.6840259594734,0.0,1000000.0,57424484.0,60403.333212677695,inf,0.9133817710465275 -diskann-t2,DiskANN,msspacev-1B,10,1122.9665691083565,0.0,1000000.0,57424484.0,51136.41454669079,inf,0.9097182425978987 -diskann-t2,DiskANN,msspacev-1B,10,1505.677457711673,0.0,1000000.0,57424484.0,38138.635672525554,inf,0.9009551098376314 -diskann-t2,DiskANN,msspacev-1B,10,1702.1793320297897,0.0,1000000.0,57424484.0,33735.860211346415,inf,0.8958520944194296 -diskann-t2,DiskANN,msspacev-1B,10,1226.7363205846661,0.0,1000000.0,57424484.0,46810.779982964326,inf,0.9076204120616728 -diskann-t2,DiskANN,msspacev-1B,10,1981.1706313882712,0.0,1000000.0,57424484.0,28985.12782806637,inf,0.8887331150225133 -diskann-t2,DiskANN,msspacev-1B,10,1030.4179244402635,0.0,1000000.0,57424484.0,55729.31393948114,inf,0.91110997407559 -diskann-t2,DiskANN,msspacev-1B,10,1346.1162781430423,0.0,1000000.0,57424484.0,42659.37863794104,inf,0.9046800382043936 -diskann-t2,DiskANN,text2image-1B,10,2659.429096957006,0.0,1000000.0,63315692.0,23808.001526510936,0.27174 -diskann-t2,DiskANN,text2image-1B,10,1084.2778991135426,0.0,1000000.0,63315692.0,58394.33972763264,0.59194 -diskann-t2,DiskANN,text2image-1B,10,1987.4666943394475,0.0,1000000.0,63315692.0,31857.485803576466,0.384928 -diskann-t2,DiskANN,text2image-1B,10,950.2152736328754,0.0,1000000.0,63315692.0,66632.99755005055,0.6246579999999999 -diskann-t2,DiskANN,text2image-1B,10,1529.0100796529537,0.0,1000000.0,63315692.0,41409.59751839638,0.488544 -diskann-t2,DiskANN,text2image-1B,10,1011.6194816882818,0.0,1000000.0,63315692.0,62588.446689789984,0.609235 -diskann-t2,DiskANN,text2image-1B,10,1382.9423353887794,0.0,1000000.0,63315692.0,45783.32037409238,0.521979 
-diskann-t2,DiskANN,text2image-1B,10,1715.704209800216,0.0,1000000.0,63315692.0,36903.61755734851,0.445646 -diskann-t2,DiskANN,text2image-1B,10,1166.7836574132612,0.0,1000000.0,63315692.0,54265.15155377628,0.572158 -diskann-t2,DiskANN,text2image-1B,10,1265.0557338512756,0.0,1000000.0,63315692.0,50049.72532494257,0.549218 -diskann-t2,DiskANN,msturing-1B,10,1488.9374886469645,0.0,1000000.0,60662240.0,40741.96563827896,0.937403 -diskann-t2,DiskANN,msturing-1B,10,1283.6399190951693,0.0,1000000.0,60662240.0,47257.988083418655,0.946902 -diskann-t2,DiskANN,msturing-1B,10,1439.2729152786703,0.0,1000000.0,60662240.0,42147.83683902969,0.939912 -diskann-t2,DiskANN,msturing-1B,10,1160.2685821000873,0.0,1000000.0,60662240.0,52282.929087161254,0.952509 -diskann-t2,DiskANN,msturing-1B,10,1871.1431910244708,0.0,1000000.0,60662240.0,32419.881220734784,0.918614 -diskann-t2,DiskANN,msturing-1B,10,1454.2011212492587,0.0,1000000.0,60662240.0,41715.165195228954,0.939076 -diskann-t2,DiskANN,msturing-1B,10,1526.0685111801067,0.0,1000000.0,60662240.0,39750.66620900917,0.935642 -diskann-t2,DiskANN,msturing-1B,10,2198.1542303679685,0.0,1000000.0,60662240.0,27596.898871761703,0.900497 -diskann-t2,DiskANN,msturing-1B,10,1623.0586342268134,0.0,1000000.0,60662240.0,37375.26095531235,0.9310269999999999 -diskann-t2,DiskANN,msturing-1B,10,972.1252420784929,0.0,1000000.0,60662240.0,62401.671486586,0.960867 -diskann-t2,DiskANN,ssnpp-1B,60000,1333.8432820515925,0.0,1000000.0,62999136.0,47231.28784897477,0.178445601986414 -diskann-t2,DiskANN,ssnpp-1B,60000,1856.1525168484525,0.0,1000000.0,62999136.0,33940.710921194,0.1457741211862014 -diskann-t2,DiskANN,ssnpp-1B,60000,2093.526127890431,0.0,1000000.0,62999136.0,30092.357177066573,0.13150131209619825 -diskann-t2,DiskANN,ssnpp-1B,60000,1715.8090468634405,0.0,1000000.0,62999136.0,36716.868998426515,0.1627462515985982 -diskann-t2,DiskANN,ssnpp-1B,60000,1319.99508156511,0.0,1000000.0,62999136.0,47726.796016014174,0.15215346231460414 
-diskann-t2,DiskANN,ssnpp-1B,60000,1316.7561211606983,0.0,1000000.0,62999136.0,47844.1945228759,0.178445601986414 -diskann-t2,DiskANN,ssnpp-1B,60000,2409.745042633539,0.0,1000000.0,62999136.0,26143.486088947448,0.12175038200269063 -diskann-t2,DiskANN,ssnpp-1B,60000,1866.6323831709003,0.0,1000000.0,62999136.0,33750.157003588254,0.1457741211862014 -diskann-t2,DiskANN,ssnpp-1B,60000,1299.947787665343,0.0,1000000.0,62999136.0,48462.82027460816,0.195030279941537 diff --git a/t1_t2/results/T2/ssnpp-1B-IO.png b/t1_t2/results/T2/ssnpp-1B-IO.png deleted file mode 100755 index d50aa2eac..000000000 Binary files a/t1_t2/results/T2/ssnpp-1B-IO.png and /dev/null differ diff --git a/t1_t2/results/T2/ssnpp-1B.png b/t1_t2/results/T2/ssnpp-1B.png deleted file mode 100755 index a450a2b11..000000000 Binary files a/t1_t2/results/T2/ssnpp-1B.png and /dev/null differ diff --git a/t1_t2/results/T2/text2image-1B-IO.png b/t1_t2/results/T2/text2image-1B-IO.png deleted file mode 100755 index 6a136e388..000000000 Binary files a/t1_t2/results/T2/text2image-1B-IO.png and /dev/null differ diff --git a/t1_t2/results/T2/text2image-1B.png b/t1_t2/results/T2/text2image-1B.png deleted file mode 100644 index e7caf1ada..000000000 Binary files a/t1_t2/results/T2/text2image-1B.png and /dev/null differ diff --git a/t3/LB_history/Dec.2.2021/LEADERBOARDS.md b/t3/LB_history/Dec.2.2021/LEADERBOARDS.md deleted file mode 100644 index 7a8a1031f..000000000 --- a/t3/LB_history/Dec.2.2021/LEADERBOARDS.md +++ /dev/null @@ -1,571 +0,0 @@ -# T3 Track Leaderboards (Unofficial) - -Please note that all rankings are currently unofficial due to the following reasons: -* All [open tasks and issues](TASKS_ISSUES_RESOLUTIONS.md) must be resolved. 
- -## Final Rankings On Private Query Set - -*Not yet available* - -## Rankings On Public Query Set - -### Rankings By Submission Name (alphabetical) - -|Submission |Team |Hardware |[Recall Rank](#recall-or-ap-rankings)|[Thru-put Rank](#throughput-rankings)|[Power Rank](#power-rankings)|[Cost Rank](#cost-rankings)|Status |Anomalies|Evaluator|Algo |Runs | -|--------------------|-----------|----------|---------|---------|---------|--------|---------|---------|---------|---------|--------| -|[diskann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/diskann-bare-metal/README.md) |Microsoft Research India(*org*) |Dell PowerEdge |[1](#recall-or-ap-rankings) |[5](#throughput-rankings) |*NQ* |*NQ* |final |*NA* |Harsha Simhadri |[src](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/benchmark/algorithms/diskann-t2.py) |[nb](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/EvalPublic.ipynb) | -|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |[6](#recall-or-ap-rankings) |[6](#throughput-rankings) |[5](#power-rankings) |[5](#cost-rankings) |final |0/58 |George Williams |[src](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/benchmark/algorithms/faiss_t3.py) |[nb](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/EvalPublic.ipynb) | -|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |[4](#recall-or-ap-rankings) |[4](#throughput-rankings) |[4](#power-rankings) |[4](#cost-rankings) |final |0/60 |George Williams |[src](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/benchmark/algorithms/gemini.py) |[nb](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/EvalPublic.ipynb) | 
-|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |[3](#recall-or-ap-rankings) |[3](#throughput-rankings) |[1](#power-rankings) |[2](#cost-rankings)\*\* |final |[5/50](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/ANOMALIES.md) |George Williams |[src](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/benchmark/algorithms/cuanns_ivfpq.py) |[nb](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/EvalPublic.ipynb) | -|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |[5](#recall-or-ap-rankings) |[1](#throughput-rankings) |[3](#power-rankings) |[3](#cost-rankings)\*\* |final |[4/40](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/ANOMALIES.md) |George Williams |[src](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/benchmark/algorithms/cuanns_multigpu.py) |[nb](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/EvalPublic.ipynb) | -|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md)|Intel |Intel Optane |[2](#recall-or-ap-rankings) |[2](#throughput-rankings) |[2](#power-rankings) |[1](#cost-rankings)|final |[5/50](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/ANOMALIES.md) |George Williams |[src](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/benchmark/algorithms/graphann.py) |[nb](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/EvalPublic.ipynb)| - -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - * *NQ* = not 
qualified - * *NA* = data is not yet available, or has not yet been processed - -* *Anomalies* are defined as queries that could potentially be the result of query response caching, a violation of the competition. Our detection method looks for a 30% or more improvement in the batch query latency between the first and last query of a query group (5). Participants have been given a chance to explain why detected anomalies (if any) are not a result of query response caching. - -* \*\*Nvidia has not yet approved the MSRP cost used for ranking, so participation in this benchmark is still pending. - -### Rankings Per Metric - -#### Recall Or AP Rankings - -|Rank|Submission |Team |Hardware|Status |Score |[Deep1B](#deep1B-recall-rankings)|[BigANN](#bigann-recall-rankings)|[MSTuring](#msturing-recall-rankings)|[MSSpace](#msspace-recall-rankings)|[Text2Image](#text2image-recall-rankings)|[FBSSNet](#fbsimsearchnet-ap-rankings)| -|----|------------------|-------|--------|-------|-----------|------|------|--------|-------|----------|-------| -| 1|[diskann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/diskann-bare-metal/README.md)|Microsoft Research India(*org*)|Dell PowerEdge |final|**0.410**|[0.99821](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/deep-1B_recall.png) |[0.99976](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/bigann-1B_recall.png) |[0.99444](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/msturing-1B_recall.png) |[0.99342](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/msspacev-1B_recall.png) |[0.98130](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/text2image-1B_recall.png) |- | -| 
2|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md)|Intel|Intel Optane |final|**0.409**|[0.99882](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/deep-1B_recall.png) |[0.99978](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/bigann-1B_recall.png) |[0.99568](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/msturing-1B_recall.png) |[0.99835](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/msspacev-1B_recall.png) |[0.97340](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/text2image-1B_recall.png) |- | -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md)|NVidia|NVidia GPU |final|**0.368**|[0.99541](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/deep-1B_recall.png) |[0.99882](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/bigann-1B_recall.png) |[0.98993](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/msturing-1B_recall.png) |[0.99428](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/msspacev-1B_recall.png) |[0.94691](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/text2image-1B_recall.png) |- | -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md)|GSI Technology(*org*)|LedaE APU |final|**0.339**|[0.99208](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/deep-1B_recall.png) |[0.99328](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/bigann-1B_recall.png) 
|[0.97841](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/msturing-1B_recall.png) |[0.98622](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/msspacev-1B_recall.png) |[0.92855](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/text2image-1B_recall.png) |[0.99684](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/ssnpp-1B_recall.png) | -| 5|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md)|NVidia|NVidia GPU |final|**0.268**|[0.99504](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/deep-1B_recall.png) |[0.99815](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/bigann-1B_recall.png) |[0.98399](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/msturing-1B_recall.png) |[0.98785](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/msspacev-1B_recall.png) |- |- | -| 6|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md)|Facebook Research(*org*)|NVidia GPU |final|**baseline**|[0.94275](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/deep-1B_recall.png) |[0.93260](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/bigann-1B_recall.png) |[0.91322](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/msturing-1B_recall.png) |[0.90853](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/msspacev-1B_recall.png) |[0.86028](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/text2image-1B_recall.png) 
|[0.97863](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/ssnpp-1B_recall.png) | - -* A submission must support at least 3 databases to qualify for this ranking. -* The ranking is based on the score, which is the sum of benchmark improvements of qualifying databases (shown in specific database columns after the score column.) -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - -#### Throughput Rankings - -|Rank|Submission |Team |Hardware|Status |Score |[Deep1B](#deep1B-throughput-rankings)|[BigANN](#bigann-throughput-rankings)|[MSTuring](#msturing-throughput-rankings)|[MSSpace](#msspace-throughput-rankings)|[Text2Image](#text2image-throughput-rankings)|[FBSSNet](#fbsimsearchnet-throughput-rankings)| -|----|------------------|-------|--------|-------|-----------|------|------|--------|-------|----------|--------------| -| 1|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md)|NVidia|NVidia GPU |final|**3001623.821**|[816,807](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/deep-1B_throughput.png) |[767,653](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/bigann-1B_throughput.png) |[586,722](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/msturing-1B_throughput.png) |[844,287](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/msspacev-1B_throughput.png) |- |- | -| 2|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md)|Intel|Intel Optane 
|final|**853256.879**|[196,546](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/deep-1B_throughput.png) |[335,991](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/bigann-1B_throughput.png) |[161,463](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/msturing-1B_throughput.png) |[157,828](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/msspacev-1B_throughput.png) |[17,063](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/text2image-1B_throughput.png) |- | -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md)|NVidia|NVidia GPU |final|**401541.475**|[91,938](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/deep-1B_throughput.png) |[85,446](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/bigann-1B_throughput.png) |[110,830](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/msturing-1B_throughput.png) |[109,621](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/msspacev-1B_throughput.png) |[19,340](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/text2image-1B_throughput.png) |- | -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md)|GSI Technology(*org*)|LedaE APU |final|**52429.395**|[10,704](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/deep-1B_throughput.png) |[10,672](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/bigann-1B_throughput.png) 
|[21,780](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/msturing-1B_throughput.png) |[16,422](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/msspacev-1B_throughput.png) |[4,838](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/text2image-1B_throughput.png) |[9,345](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/ssnpp-1B_throughput.png) | -| 5|[diskann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/diskann-bare-metal/README.md)|Microsoft Research India(*org*)|Dell PowerEdge |final|**49398.127**|[12,927](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/deep-1B_throughput.png) |[19,094](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/bigann-1B_throughput.png) |[17,201](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/msturing-1B_throughput.png) |[6,503](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/msspacev-1B_throughput.png) |[9,307](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/text2image-1B_throughput.png) |- | -| 6|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md)|Facebook Research(*org*)|NVidia GPU |final|**baseline**|[4,464](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/deep-1B_throughput.png) |[3,271](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/bigann-1B_throughput.png) |[2,845](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/msturing-1B_throughput.png) |[3,265](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/msspacev-1B_throughput.png) 
|[1,789](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/text2image-1B_throughput.png) |[5,699](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/ssnpp-1B_throughput.png) | - -* A submission must support at least 3 databases to qualify for this ranking. -* The ranking is based on the score, which is the sum of benchmark improvements of qualifying databases (shown in specific database columns after the score column.) -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - -#### Power Rankings - -|Rank|Submission |Team |Hardware|Status |Score |[Deep1B](#deep1B-power-rankings)|[BigANN](#bigann-power-rankings)|[MSTuring](#msturing-power-rankings)|[MSSpace](#msspace-power-rankings)|[Text2Image](#text2image-power-rankings)|[FBSSNet](#fbsimsearchnet-power-rankings)| -|----|------------------|-------|--------|-------|-----------|------|------|--------|-------|-----|-----| -| 1|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md)|NVidia|NVidia GPU |final|**-0.691**|[0.0024](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/deep-1B_power.png) |[0.0023](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/bigann-1B_power.png) |[0.0016](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/msturing-1B_power.png) |[0.0017](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/msspacev-1B_power.png) |[0.0094](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/text2image-1B_power.png)|-| -| 
2|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md)|Intel|Intel Optane |final|**-0.648**|[0.0041](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/deep-1B_power.png) |[0.0022](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/bigann-1B_power.png) |[0.0048](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/msturing-1B_power.png) |[0.0049](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/msspacev-1B_power.png) |[0.0446](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/text2image-1B_power.png)|-| -| 3|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md)|NVidia|NVidia GPU |final|**-0.594**|[0.0002](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/deep-1B_power.png) |[0.0003](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/bigann-1B_power.png) |[0.0004](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/msturing-1B_power.png) |[0.0002](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/msspacev-1B_power.png) |-|-| -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md)|GSI Technology(*org*)|LedaE APU |final|**-0.513**|[0.0337](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/deep-1B_power.png) |[0.0341](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/bigann-1B_power.png) |[0.0236](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/msturing-1B_power.png) 
|[0.0230](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/msspacev-1B_power.png) |[0.1242](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/text2image-1B_power.png)|[0.0469](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/ssnpp-1B_power.png)| -| 5|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/diskann-bare-metal/README.md)|Facebook Research(*org*)|NVidia GPU |final|**baseline**|[0.1117](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/deep-1B_power.png) |[0.1576](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/bigann-1B_power.png) |[0.1743](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/msturing-1B_power.png) |[0.1520](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/msspacev-1B_power.png) |[0.1128](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/text2image-1B_power.png)|[0.0904](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/ssnpp-1B_power.png)| -| 6|[-](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md)|-|- |-|**-**|- |- |- |- |-|-| - -* A submission must support at least 3 databases to qualify for this ranking. -* The ranking is based on the score, which is the sum of benchmark improvements of qualifying databases (shown in specific database columns after the score column.) 
-* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - -#### Cost Rankings - -|Rank|Submission |Team |Hardware|Status |Score |[Deep1B](#deep1B-cost-rankings)|[BigANN](#bigann-cost-rankings)|[MSTuring](#msturing-cost-rankings)|[MSSpace](#msspace-cost-rankings)|[Text2Image](#text2image-cost-rankings)|[FBSSNet](#fbsimsearchnet-cost-rankings)| -|----|------------------|-------|--------|-------|-----------|------|------|--------|-------|----------|--------------| -| 1|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md)|Intel|Intel Optane |final|**$-3,978,198.83**|$16,086.82 |$15,439.92 |$16,347.45 |$16,382.81 |$103,599.49 |- | -| 2|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md)|NVidia|NVidia GPU |final|**$-2,339,919.09\*\***|$300,843.83 |$300,815.92 |$150,563.49 |$150,605.68 |$903,307.30 |- | -| 3|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md)|NVidia|NVidia GPU |final|**$-2,272,942.67\*\***|$150,082.04 |$150,088.58 |$150,127.39 |$150,078.78 |- |- | -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md)|GSI Technology(*org*)|LedaE APU |final|**$-907,570.13**|$569,058.09 |$569,210.35 |$286,911.87 |$398,163.18 |$1,213,773.56 |$629,442.91 | -| 5|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md)|Facebook Research(*org*)|NVidia GPU |final|**baseline**|$545,633.16 |$737,886.17 |$853,857.46 |$735,942.66 |$1,272,735.86 |$428,074.79 | -| 6|[-](-)|-|- |-|**-**|- |- |- |- |- |- | - -* A submission must support at least 3 databases to qualify for this ranking. 
-* The ranking is based on the score, which is the sum of benchmark improvements of qualifying databases (shown in specific database columns after the score column.) -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - -* \*\*Nvidia has not yet approved the MSRP cost used for ranking, so participation in this benchmark is still pending. - -### Rankings Per Database - -#### Deep1B - -##### Deep1B Recall Rankings - -|Rank|Submission |Team |Hardware |Status |R@10 | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|-----------| -| 1|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |final|**[0.99882](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/deep-1B_recall.png)**| -| 2|[diskann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/diskann-bare-metal/README.md) |Microsoft Research India(*org*) |Dell PowerEdge |final|**[0.99821](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/deep-1B_recall.png)**| -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |final|**[0.99541](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/deep-1B_recall.png)**| -| 4|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |final|**[0.99504](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/deep-1B_recall.png)**| -| 5|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) 
|LedaE APU |final|**[0.99208](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/deep-1B_recall.png)**| -| 6|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**[0.94275](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/deep-1B_recall.png)**| - -* The operational point for ranking is 2000 QPS. We will use the highest recall for the search parameters that meet or exceed 2000 QPS. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - -##### Deep1B Throughput Rankings - -|Rank|Submission |Team |Hardware |Status |Q/S | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|-----------| -| 1|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |final|**[816,807](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/deep-1B_throughput.png)**| -| 2|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |final|**[196,546](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/deep-1B_throughput.png)**| -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |final|**[91,938](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/deep-1B_throughput.png)**| -| 4|[diskann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/diskann-bare-metal/README.md) |Microsoft Research India(*org*) |Dell PowerEdge 
|final|**[12,927](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/deep-1B_throughput.png)**| -| 5|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**[10,704](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/deep-1B_throughput.png)**| -| 6|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**[4,464](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/deep-1B_throughput.png)**| - -* The operational point for ranking is 0.90 recall@10. We will use the highest throughput for the search parameters that meet or exceed 0.90 recall@10. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - -##### Deep1B Power Rankings - -|Rank|Submission |Team |Hardware |Status |W*S/Q | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|-----------| -| 1|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |final|**[0.0002](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/deep-1B_power.png)**| -| 2|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |final|**[0.0024](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/deep-1B_power.png)**| -| 3|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane 
|final|**[0.0041](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/deep-1B_power.png)**| -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**[0.0337](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/deep-1B_power.png)**| -| 5|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**[0.1117](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/deep-1B_power.png)**| -| 6|[-](-) |- |- |-|**-**| - -* The operational point for ranking is 0.90 recall@10. We will use the lowest power consumption for the search parameters that meet or exceed 0.90 recall@10. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - -##### Deep1B Cost Rankings - -|Rank|Submission |Team |Hardware |Status |Cost |capex |opex |unit cost|units@100K qps|KwH*4yrs | -|----|--------------------|---------|-----------------------|--------|-------------|--------|--------|---------|--------------|---------| -| 1|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md)|Intel |Intel Optane |final|**$16,086.82** |$14,664.20|$1,422.62|$14,664.20 |1 |14,226.208| -| 2|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md)|NVidia |NVidia GPU |final|**$150,082.04\*\*** |$150,000.00|$82.04|$150,000.00 |1 |820.405| -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md)|NVidia |NVidia GPU |final|**$300,843.83\*\*** |$300,000.00|$843.83|$150,000.00 |2 |8,438.315| -| 
4|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md)|Facebook Research(*org*) |NVidia GPU |final|**$545,633.16** |$506,503.70|$39,129.46|$22,021.90 |23 |391,294.584| -| 5|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md)|GSI Technology(*org*) |LedaE APU |final|**$569,058.09** |$557,266.60|$11,791.49|$55,726.66 |10 |117,914.908| -| 6|[-](-)|- |- |-|**-** |-|-|- |- |-| - -* The operational point for ranking is 0.90 recall@10. We will use the lowest power consumption/query for the search parameters that meet or exceed 0.90 recall@10. -* The formula is based on: - * Take the algorithm's throughput submitted to leaderboard, use it to scale no. of systems needed to scale to 100K qps (using ceiling to round up any decimal.) - * Capex = cost per system * scale no. - * Take w*s/q from algorithm's power metric submitted to leaderboard and convert to KwH/q. - * Multiply by total queries at 100K qps for 4 years = 4x365x24x60x60x100000 total queries - * Opex = (total queries over 4 years) * KwH/query * $0.10/KwH -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress -* \*\*Nvidia has not yet approved the MSRP cost used for ranking, so participation in this benchmark is still pending. 
- -#### BigANN - -##### BigANN Recall Rankings - -|Rank|Submission |Team |Hardware |Status |R@10 | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|-------------| -| 1|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |final|**[0.99978](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/bigann-1B_recall.png)** | -| 2|[diskann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/diskann-bare-metal/README.md) |Microsoft Research India(*org*) |Dell PowerEdge |final|**[0.99976](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/bigann-1B_recall.png)** | -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |final|**[0.99882](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/bigann-1B_recall.png)** | -| 4|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |final|**[0.99815](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/bigann-1B_recall.png)** | -| 5|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**[0.99328](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/bigann-1B_recall.png)** | -| 6|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**[0.93260](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/bigann-1B_recall.png)** | - -* The operational point for ranking is 2000 QPS. 
We will use the highest recall for the search parameters that meet or exceed 2000 QPS. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - -##### BigANN Throughput Rankings - -|Rank|Submission |Team |Hardware |Status |Q/S | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|-------------| -| 1|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |final|**[767,653](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/bigann-1B_throughput.png)** | -| 2|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |final|**[335,991](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/bigann-1B_throughput.png)** | -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |final|**[85,446](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/bigann-1B_throughput.png)** | -| 4|[diskann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/diskann-bare-metal/README.md) |Microsoft Research India(*org*) |Dell PowerEdge |final|**[19,094](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/bigann-1B_throughput.png)** | -| 5|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**[10,672](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/bigann-1B_throughput.png)** | -| 
6|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**[3,271](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/bigann-1B_throughput.png)** | - -* The operational point for ranking is 0.90 recall@10. We will use the highest throughput for the search parameters that meet or exceed 0.90 recall@10. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - -##### BigANN Power Rankings - -|Rank|Submission |Team |Hardware |Status |W*S/Q | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|-----------| -| 1|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |final|**[0.0003](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/bigann-1B_power.png)**| -| 2|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |final|**[0.0022](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/bigann-1B_power.png)**| -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |final|**[0.0023](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/bigann-1B_power.png)**| -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**[0.0341](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/bigann-1B_power.png)**| -| 
5|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**[0.1576](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/bigann-1B_power.png)**| -| 6|[-](-) |- |- |-|**-**| - -* The operational point for ranking is 0.90 recall@10. We will use the lowest power consumption for the search parameters that meet or exceed 0.90 recall@10. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - -##### BigANN Cost Rankings - -|Rank|Submission |Team |Hardware |Status |Cost |capex |opex |unit cost|units@100K qps|KwH*4yrs | -|----|--------------------|------------------------------|--------------------|--------|--------------|--------|--------|---------|--------------|---------| -| 1|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md)|Intel |Intel Optane |final|**$15,439.92** |$14,664.20|$775.72|$14,664.20 |1 |7,757.221| -| 2|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md)|NVidia |NVidia GPU |final|**$150,088.58\*\*** |$150,000.00|$88.58|$150,000.00 |1 |885.770| -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md)|NVidia |NVidia GPU |final|**$300,815.92\*\*** |$300,000.00|$815.92|$150,000.00 |2 |8,159.226| -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md)|GSI Technology(*org*) |LedaE APU |final|**$569,210.35** |$557,266.60|$11,943.75|$55,726.66 |10 |119,437.537| -| 5|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md)|Facebook Research(*org*) |NVidia GPU |final|**$737,886.17** |$682,678.90|$55,207.27|$22,021.90 |31 |552,072.703| -| 
6|[-](-)|- |- |-|**-** |-|-|- |- |-| - -* The operational point for ranking is 0.90 recall@10. We will use the lowest power consumption/query for the search parameters that meet or exceed 0.90 recall@10. -* The formula is based on: - * Take the algorithm's throughput submitted to leaderboard, use it to scale no. of systems needed to scale to 100K qps (using ceiling to round up any decimal.) - * Capex = cost per system * scale no. - * Take w*s/q from algorithm's power metric submitted to leaderboard and convert to KwH/q. - * Multiply by total queries at 100K qps for 4 years = 4x365x24x60x60x100000 total queries over 4 years. - * Opex = (total queries over 4 years) * KwH/query * $0.10/KwH -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress -* \*\*Nvidia has not yet approved the MSRP cost used for ranking, so participation in this benchmark is still pending. 
- -#### MSTuring - -##### MSTuring Recall Rankings - -|Rank|Submission |Team |Hardware |Status |R@10 | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|---------------| -| 1|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |final|**[0.99568](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/msturing-1B_recall.png)** | -| 2|[diskann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/diskann-bare-metal/README.md) |Microsoft Research India(*org*) |Dell PowerEdge |final|**[0.99444](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/msturing-1B_recall.png)** | -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |final|**[0.98993](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/msturing-1B_recall.png)** | -| 4|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |final|**[0.98399](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/msturing-1B_recall.png)** | -| 5|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**[0.97841](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/msturing-1B_recall.png)** | -| 6|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**[0.91322](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/msturing-1B_recall.png)** | - -* The operational point for ranking is 2000 QPS. 
We will use the highest recall for the search parameters that meet or exceed 2000 QPS. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - -##### MSTuring Throughput Rankings - -|Rank|Submission |Team |Hardware |Status |Q/S | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|------------| -| 1|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |final|**[586,722](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/msturing-1B_throughput.png)** | -| 2|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |final|**[161,463](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/msturing-1B_throughput.png)** | -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |final|**[110,830](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/msturing-1B_throughput.png)** | -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**[21,780](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/msturing-1B_throughput.png)** | -| 5|[diskann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/diskann-bare-metal/README.md) |Microsoft Research India(*org*) |Dell PowerEdge |final|**[17,201](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/msturing-1B_throughput.png)** | -| 
6|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**[2,845](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/msturing-1B_throughput.png)** | - -* The operational point for ranking is 0.90 recall@10. We will use the highest throughput for the search parameters that meet or exceed 0.90 recall@10. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - -##### MSTuring Power Rankings - -|Rank|Submission |Team |Hardware |Status|W*S/Q | -|----|-------------------------------------------------------|------------------------------|-----------------------|------|--------------| -| 1|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |final|**[0.0004](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/msturing-1B_power.png)** | -| 2|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |final|**[0.0016](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/msturing-1B_power.png)** | -| 3|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |final|**[0.0048](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/msturing-1B_power.png)** | -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**[0.0236](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/msturing-1B_power.png)** | -| 
5|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**[0.1743](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/msturing-1B_power.png)** | -| 6|[-](-) |- |- |-|**-** | - -* The operational point for ranking is 0.90 recall@10. We will use the lowest power consumption for the search parameters that meet or exceed 0.90 recall@10. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - -##### MSTuring Cost Rankings - -|Rank|Submission |Team |Hardware |Status |Cost |capex |opex |unit cost|units@100K qps|KwH*4yrs | -|----|------------------------------------|------------------------------|-----------------------|--------|--------------|--------|--------|---------|--------------|----------| -| 1|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |final|**$16,347.45** |$14,664.20|$1,683.25|$14,664.20 |1 |16,832.451 | -| 2|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |final|**$150,127.39\*\*** |$150,000.00|$127.39|$150,000.00 |1 |1,273.870 | -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |final|**$150,563.49\*\*** |$150,000.00|$563.49|$150,000.00 |1 |5,634.885 | -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**$286,911.87** |$278,633.30|$8,278.57|$55,726.66 |5 |82,785.683 | -| 5|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**$853,857.46** 
|$792,788.40|$61,069.06|$22,021.90 |36 |610,690.611 | -| 6|[-](-) |- |- |-|**-** |-|-|- |- |- | - -* The operational point for ranking is 0.90 recall@10. We will use the lowest power consumption/query for the search parameters that meet or exceed 0.90 recall@10. -* The formula is based on: - * Take the algorithm's throughput submitted to leaderboard, use it to scale no. of systems needed to scale to 100K qps (using ceiling to round up any decimal.) - * Capex = cost per system * scale no. - * Take w*s/q from algorithm's power metric submitted to leaderboard and convert to KwH/q. - * Multiply by total queries at 100K qps for 4 years = 4x365x24x60x60x100000 total queries over 4 years. - * Opex = (total queries over 4 years) * KwH/query * $0.10/KwH -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress -* \*\*Nvidia has not yet approved the MSRP cost used for ranking, so participation in this benchmark is still pending. 
- -#### MSSpace - -##### MSSpace Recall Rankings - -|Rank|Submission |Team |Hardware |Status |R@10 | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|---------| -| 1|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |final|**[0.99835](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/msspacev-1B_recall.png)** | -| 2|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |final|**[0.99428](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/msspacev-1B_recall.png)** | -| 3|[diskann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/diskann-bare-metal/README.md) |Microsoft Research India(*org*) |Dell PowerEdge |final|**[0.99342](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/msspacev-1B_recall.png)** | -| 4|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |final|**[0.98785](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/msspacev-1B_recall.png)** | -| 5|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**[0.98622](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/msspacev-1B_recall.png)** | -| 6|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**[0.90853](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/msspacev-1B_recall.png)** | - -* The operational point for ranking is 2000 QPS. 
We will use the highest recall for the search parameters that meet or exceed 2000 QPS. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - -##### MSSpace Throughput Rankings - -|Rank|Submission |Team |Hardware |Status |Q/S | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|------------| -| 1|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |final|**[844,287](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/msspacev-1B_throughput.png)** | -| 2|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |final|**[157,828](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/msspacev-1B_throughput.png)** | -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |final|**[109,621](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/msspacev-1B_throughput.png)** | -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**[16,422](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/msspacev-1B_throughput.png)** | -| 5|[diskann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/diskann-bare-metal/README.md) |Microsoft Research India(*org*) |Dell PowerEdge |final|**[6,503](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/msspacev-1B_throughput.png)** | -| 
6|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**[3,265](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/msspacev-1B_throughput.png)** | - -* The operational point for ranking is 0.9 recall@10. We will use the highest throughput for the search parameters that meet or exceed 0.9 recall@10. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - -##### MSSpace Power Rankings - -|Rank|Submission |Team |Hardware |Status |W*S/Q | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|------------| -| 1|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |final|**[0.0002](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/msspacev-1B_power.png)** | -| 2|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |final|**[0.0017](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/msspacev-1B_power.png)** | -| 3|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |final|**[0.0049](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/msspacev-1B_power.png)** | -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**[0.0230](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/msspacev-1B_power.png)** | -| 
5|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**[0.1520](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/msspacev-1B_power.png)** | -| 6|[-](-) |- |- |-|**-** | - -* The operational point for ranking is 0.9 recall@10. We will use the lowest power consumption for the search parameters that meet or exceed 0.9 recall@10. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - -##### MSSpace Cost Rankings - -|Rank|Submission |Team |Hardware |Status |Cost |capex |opex |unit cost|units@100K qps|KwH*4yrs | -|----|--------------------|------------------------------|-----------------------|------- |--------------|--------|--------|---------|--------------|----------| -| 1|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md)|Intel |Intel Optane |final|**$16,382.81** |$14,664.20|$1,718.61|$14,664.20 |1 |17,186.056 | -| 2|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md)|NVidia |NVidia GPU |final|**$150,078.78\*\*** |$150,000.00|$78.78|$150,000.00 |1 |787.774 | -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md)|NVidia |NVidia GPU |final|**$150,605.68\*\*** |$150,000.00|$605.68|$150,000.00 |1 |6,056.841 | -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md)|GSI Technology(*org*) |LedaE APU |final|**$398,163.18** |$390,086.62|$8,076.56|$55,726.66 |7 |80,765.638 | -| 5|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md)|Facebook Research(*org*) |NVidia GPU |final|**$735,942.66** |$682,678.90|$53,263.76|$22,021.90 |31 
|532,637.584 | -| 6|[-](-)|- |- |-|**-** |-|-|- |- |- | - -* The operational point for ranking is 0.90 recall@10. We will use the lowest power consumption/query for the search parameters that meet or exceed 0.90 recall@10. -* The formula is based on: - * Take the algorithm's throughput submitted to leaderboard, use it to scale no. of systems needed to scale to 100K qps (using ceiling to round up any decimal.) - * Capex = cost per system * scale no. - * Take w*s/q from algorithm's power metric submitted to leaderboard and convert to KwH/q. - * Multiply by total queries at 100K qps for 4 years = 4x365x24x60x60x100000 total queries over 4 years. - * Opex = (total queries over 4 years) * KwH/query * $0.10/KwH -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress -* \*\*Nvidia has not yet approved the MSRP cost used for ranking, so participation in this benchmark is still pending. 
- -#### Text2Image - -##### Text2Image Recall Rankings - -|Rank|Submission |Team |Hardware |Status |R@10 | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|-------------| -| 1|[diskann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/diskann-bare-metal/README.md) |Microsoft Research India(*org*) |Dell PowerEdge |final|**[0.98130](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/text2image-1B_recall.png)** | -| 2|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |final|**[0.97340](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/text2image-1B_recall.png)** | -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |final|**[0.94691](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/text2image-1B_recall.png)** | -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**[0.92855](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/text2image-1B_recall.png)** | -| 5|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**[0.86028](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/text2image-1B_recall.png)** | -| 6|[-](-) |- |- |-|**-** | - -* The operational point for ranking is 2000 QPS. We will use the highest recall for the search parameters that meet or exceed 2000 QPS. 
-* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - -##### Text2Image Throughput Rankings - -|Rank|Submission |Team |Hardware |Status |Q/S | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|------------| -| 1|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |final|**[19,340](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/text2image-1B_throughput.png)** | -| 2|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |final|**[17,063](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/text2image-1B_throughput.png)** | -| 3|[diskann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/diskann-bare-metal/README.md) |Microsoft Research India(*org*) |Dell PowerEdge |final|**[9,307](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/text2image-1B_throughput.png)** | -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**[4,838](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/text2image-1B_throughput.png)** | -| 5|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**[1,789](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/text2image-1B_throughput.png)** | -| 6|[-](-) |- |- |-|**-** | - -* The operational point for ranking is 0.860 recall@10. 
We will use the highest throughput for the search parameters that meet or exceed 0.860 recall@10. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - -##### Text2Image Power Rankings - -|Rank|Submission |Team |Hardware |Status |W*S/Q | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|-----------| -| 1|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |final|**[0.0094](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/text2image-1B_power.png)**| -| 2|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |final|**[0.0446](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/text2image-1B_power.png)**| -| 3|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**[0.1128](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/text2image-1B_power.png)**| -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**[0.1242](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/text2image-1B_power.png)**| -| 5|[-](-) |- |- |-|**-**| -| 6|[-](-) |- |- |-|**-**| - -* The operational point for ranking is 0.86 recall@10. We will use the lowest power consumption for the search parameters that meet or exceed 0.86 recall@10. 
-* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - -##### Text2Image Cost Rankings - -|Rank|Submission |Team |Hardware |Status |Cost |capex |opex |unit cost|units@100K qps|KwH*4yrs | -|----|---------------------|------------------------------|---------------------|--------|--------------|--------|--------|---------|--------------|---------| -| 1|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |final|**$103,599.49** |$87,985.20|$15,614.29|$14,664.20 |6 |156,142.873| -| 2|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |final|**$903,307.30\*\*** |$900,000.00|$3,307.30|$150,000.00 |6 |33,072.963| -| 3|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**$1,213,773.56** |$1,170,259.86|$43,513.70|$55,726.66 |21 |435,137.010| -| 4|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**$1,272,735.86** |$1,233,226.40|$39,509.46|$22,021.90 |56 |395,094.625| -| 5|[-](-) |- |- |-|**-** |-|-|- |- |-| -| 6|[-](-) |- |- |-|**-** |-|-|- |- |-| - -* The operational point for ranking is 0.86 recall@10. We will use the lowest power consumption/query for the search parameters that meet or exceed 0.86 recall@10. -* The formula is based on: - * Take the algorithm's throughput submitted to leaderboard, use it to scale no. of systems needed to scale to 100K qps (using ceiling to round up any decimal.) - * Capex = cost per system * scale no. - * Take w*s/q from algorithm's power metric submitted to leaderboard and convert to KwH/q. 
- * Multiply by total queries at 100K qps for 4 years = 4x365x24x60x60x100000 total queries over 4 years. - * Opex = (total queries over 4 years) * KwH/query * $0.10/KwH -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress -* \*\*Nvidia has not yet approved the MSRP cost used for ranking, so participation in this benchmark is still pending. - -#### FBSimSearchNet - -##### FBSimSearchNet AP Rankings - -|Rank|Submission |Team |Hardware |Status |AP | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|-------------| -| 1|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**[0.99684](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/ssnpp-1B_recall.png)** | -| 2|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**[0.97863](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/ssnpp-1B_recall.png)** | -| 3|[-](-) |- |- |-|**-** | -| 4|[-](-) |- |- |-|**-** | -| 5|[-](-) |- |- |-|**-** | -| 6|[-](-) |- |- |-|**-** | - -* The operational point for ranking is 2000 QPS. We will use the highest recall for the search parameters that meet or exceed 2000 QPS. 
-* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - -##### FBSimSearchNet Throughput Rankings - -|Rank|Submission |Team |Hardware |Status |Q/S | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|------------| -| 1|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**[9,345](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/ssnpp-1B_throughput.png)** | -| 2|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**[5,699](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/ssnpp-1B_throughput.png)** | -| 3|[-](-) |- |- |-|**-** | -| 4|[-](-) |- |- |-|**-** | -| 5|[-](-) |- |- |-|**-** | -| 6|[-](-) |- |- |-|**-** | - -* The operational point for ranking is 0.9 recall@10. We will use the highest throughput for the search parameters that meet or exceed 0.9 average precision. 
-* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - - -##### FBSimSearchNet Power Rankings - -|Rank|Submission |Team |Hardware |Status |W*S/Q | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|-----------| -| 1|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**[0.0469](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/ssnpp-1B_power.png)**| -| 2|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**[0.0904](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/ssnpp-1B_power.png)**| -| 3|[-](-) |- |- |-|**-**| -| 4|[-](-) |- |- |-|**-**| -| 5|[-](-) |- |- |-|**-**| -| 6|[-](-) |- |- |-|**-**| - -* The operational point for ranking is 0.9 recall@10. We will use the lowest power consumption for the search parameters that meet or exceed 0.9 average precision. 
-* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - -##### FBSimSearchNet Cost Rankings - -|Rank|Submission |Team |Hardware |Status |Cost |capex |opex |unit cost|units@100K qps|KwH*4yrs | -|----|--------------------|------------------------------|---------------------|--------|--------------|--------|--------|---------|--------------|---------| -| 1|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md)|Facebook Research(*org*) |NVidia GPU |final|**$428,074.79** |$396,394.20|$31,680.59|$22,021.90 |18 |316,805.859| -| 2|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md)|GSI Technology(*org*) |LedaE APU |final|**$629,442.91** |$612,993.26|$16,449.65|$55,726.66 |11 |164,496.451| -| 3|[-](-)|- |- |-|**-** | -| -| -| -| -| -| 4|[-](-)|- |- |-|**-** | -| -| -| -| -| - -* The operational point for ranking is 0.9 recall@10. We will use the lowest power consumption/query for the search parameters that meet or exceed 0.9 recall@10. -* The formula is based on: - * Take the algorithm's throughput submitted to leaderboard, use it to scale no. of systems needed to scale to 100K qps (using ceiling to round up any decimal.) - * Capex = cost per system * scale no. - * Take w*s/q from algorithm's power metric submitted to leaderboard and convert to KwH/q. - * Multiply by total queries at 100K qps for 4 years = 4x365x24x60x60x100000 total queries over 4 years. - * Opex = (total queries over 4 years) * KwH/query * $0.10/KwH -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress -* \*\*Nvidia has not yet approved the MSRP cost used for ranking, so participation in this benchmark is still pending. 
diff --git a/t3/LB_history/Dec.2.2021/LEADERBOARDS_REJECT_ANOMALIES.md b/t3/LB_history/Dec.2.2021/LEADERBOARDS_REJECT_ANOMALIES.md deleted file mode 100644 index ab8ce9cef..000000000 --- a/t3/LB_history/Dec.2.2021/LEADERBOARDS_REJECT_ANOMALIES.md +++ /dev/null @@ -1,571 +0,0 @@ -# T3 Track Leaderboards After Rejecting Anomalies (Unofficial) - -Please note that all rankings are currently unofficial due to the following reasons: -* All [open tasks and issues](TASKS_ISSUES_RESOLUTIONS.md) must be resolved. - -## Final Rankings On Private Query Set - -*Not yet available* - -## Rankings On Public Query Set - -### Rankings By Submission Name (alphabetical) - -|Submission |Team |Hardware |[Recall Rank](#recall-or-ap-rankings)|[Thru-put Rank](#throughput-rankings)|[Power Rank](#power-rankings)|[Cost Rank](#cost-rankings)|Status |Anomalies|Evaluator|Algo |Runs | -|--------------------|-----------|----------|---------|---------|---------|--------|---------|---------|---------|---------|--------| -|[diskann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/diskann-bare-metal/README.md) |Microsoft Research India(*org*) |Dell PowerEdge |[1](#recall-or-ap-rankings) |[5](#throughput-rankings) |*NQ* |*NQ* |final |*NA* |Harsha Simhadri |[src](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/benchmark/algorithms/diskann-t2.py) |[nb](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/EvalPublic.ipynb) | -|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |[6](#recall-or-ap-rankings) |[6](#throughput-rankings) |[5](#power-rankings) |[5](#cost-rankings) |final |0/58 |George Williams |[src](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/benchmark/algorithms/faiss_t3.py) |[nb](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/EvalPublic.ipynb) | 
-|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |[4](#recall-or-ap-rankings) |[4](#throughput-rankings) |[4](#power-rankings) |[4](#cost-rankings) |final |0/60 |George Williams |[src](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/benchmark/algorithms/gemini.py) |[nb](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/EvalPublic.ipynb) | -|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |[3](#recall-or-ap-rankings) |[3](#throughput-rankings) |[1](#power-rankings) |[2](#cost-rankings)\*\* |final |[5/50](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/ANOMALIES.md) |George Williams |[src](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/benchmark/algorithms/cuanns_ivfpq.py) |[nb](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/EvalPublic.ipynb) | -|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |[5](#recall-or-ap-rankings) |[1](#throughput-rankings) |[3](#power-rankings) |[3](#cost-rankings)\*\* |final |[4/40](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/ANOMALIES.md) |George Williams |[src](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/benchmark/algorithms/cuanns_multigpu.py) |[nb](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/EvalPublic.ipynb) | -|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md)|Intel |Intel Optane |[2](#recall-or-ap-rankings) |[2](#throughput-rankings) |[2](#power-rankings) |[1](#cost-rankings)|final 
|[5/50](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/ANOMALIES.md) |George Williams |[src](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/benchmark/algorithms/graphann.py) |[nb](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/EvalPublic.ipynb)| - -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - * *NQ* = not qualified - * *NA* = data is not yet available, or has not yet been processed - -* *Anomalies* are defined as queries that could potentially be the result of query response caching, a violation of the competition. Our detection method looks for a 30% or more improvement in the batch query latency between the first and last query of a query group (5). Participants have been given a chance to explain why detected anomalies (if any) are not a result of query response caching. - -* \*\*Nvidia has not yet approved the MSRP cost used for ranking, so participation in this benchmark is still pending. 
- -### Rankings Per Metric - -#### Recall Or AP Rankings - -|Rank|Submission |Team |Hardware|Status |Score |[Deep1B](#deep1B-recall-rankings)|[BigANN](#bigann-recall-rankings)|[MSTuring](#msturing-recall-rankings)|[MSSpace](#msspace-recall-rankings)|[Text2Image](#text2image-recall-rankings)|[FBSSNet](#fbsimsearchnet-ap-rankings)| -|----|------------------|-------|--------|-------|-----------|------|------|--------|-------|----------|-------| -| 1|[diskann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/diskann-bare-metal/README.md)|Microsoft Research India(*org*)|Dell PowerEdge |final|**0.410**|[0.99821](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/deep-1B_recall.png) |[0.99976](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/bigann-1B_recall.png) |[0.99444](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/msturing-1B_recall.png) |[0.99342](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/msspacev-1B_recall.png) |[0.98130](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/text2image-1B_recall.png) |- | -| 2|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md)|Intel|Intel Optane |final|**0.409**|[0.99882](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/deep-1B_recall.png) |[0.99978](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/bigann-1B_recall.png) |[0.99568](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/msturing-1B_recall.png) |[0.99835](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/msspacev-1B_recall.png) 
|[0.97340](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/text2image-1B_recall.png) |- | -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md)|NVidia|NVidia GPU |final|**0.368**|[0.99541](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/deep-1B_recall.png) |[0.99882](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/bigann-1B_recall.png) |[0.98993](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/msturing-1B_recall.png) |[0.99428](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/msspacev-1B_recall.png) |[0.94691](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/text2image-1B_recall.png) |- | -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md)|GSI Technology(*org*)|LedaE APU |final|**0.339**|[0.99208](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/deep-1B_recall.png) |[0.99328](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/bigann-1B_recall.png) |[0.97841](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/msturing-1B_recall.png) |[0.98622](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/msspacev-1B_recall.png) |[0.92855](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/text2image-1B_recall.png) |[0.99684](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/ssnpp-1B_recall.png) | -| 5|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md)|NVidia|NVidia GPU 
|final|**0.166**|[0.95736](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/deep-1B_recall.png) |[0.96750](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/bigann-1B_recall.png) |[0.96286](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/msturing-1B_recall.png) |[0.97541](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/msspacev-1B_recall.png) |- |- | -| 6|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md)|Facebook Research(*org*)|NVidia GPU |final|**baseline**|[0.94275](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/deep-1B_recall.png) |[0.93260](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/bigann-1B_recall.png) |[0.91322](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/msturing-1B_recall.png) |[0.90853](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/msspacev-1B_recall.png) |[0.86028](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/text2image-1B_recall.png) |[0.97863](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/ssnpp-1B_recall.png) | - -* A submission must support at least 3 databases to qualify for this ranking. -* The ranking is based on the score, which is the sum of benchmark improvements of qualifying databases (shown in specific database columns after the score column.) 
-* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - -#### Throughput Rankings - -|Rank|Submission |Team |Hardware|Status |Score |[Deep1B](#deep1B-throughput-rankings)|[BigANN](#bigann-throughput-rankings)|[MSTuring](#msturing-throughput-rankings)|[MSSpace](#msspace-throughput-rankings)|[Text2Image](#text2image-throughput-rankings)|[FBSSNet](#fbsimsearchnet-throughput-rankings)| -|----|------------------|-------|--------|-------|-----------|------|------|--------|-------|----------|--------------| -| 1|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md)|NVidia|NVidia GPU |final|**3001623.821**|[816,807](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/deep-1B_throughput.png) |[767,653](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/bigann-1B_throughput.png) |[586,722](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/msturing-1B_throughput.png) |[844,287](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/msspacev-1B_throughput.png) |- |- | -| 2|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md)|Intel|Intel Optane |final|**851327.044**|[196,546](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/deep-1B_throughput.png) |[335,991](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/bigann-1B_throughput.png) |[161,463](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/msturing-1B_throughput.png) 
|[155,899](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/msspacev-1B_throughput.png) |[17,063](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/text2image-1B_throughput.png) |- | -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md)|NVidia|NVidia GPU |final|**401541.475**|[91,938](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/deep-1B_throughput.png) |[85,446](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/bigann-1B_throughput.png) |[110,830](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/msturing-1B_throughput.png) |[109,621](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/msspacev-1B_throughput.png) |[19,340](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/text2image-1B_throughput.png) |- | -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md)|GSI Technology(*org*)|LedaE APU |final|**52429.395**|[10,704](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/deep-1B_throughput.png) |[10,672](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/bigann-1B_throughput.png) |[21,780](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/msturing-1B_throughput.png) |[16,422](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/msspacev-1B_throughput.png) |[4,838](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/text2image-1B_throughput.png) |[9,345](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/ssnpp-1B_throughput.png) | -| 
5|[diskann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/diskann-bare-metal/README.md)|Microsoft Research India(*org*)|Dell PowerEdge |final|**49398.127**|[12,927](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/deep-1B_throughput.png) |[19,094](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/bigann-1B_throughput.png) |[17,201](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/msturing-1B_throughput.png) |[6,503](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/msspacev-1B_throughput.png) |[9,307](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/text2image-1B_throughput.png) |- | -| 6|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md)|Facebook Research(*org*)|NVidia GPU |final|**baseline**|[4,464](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/deep-1B_throughput.png) |[3,271](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/bigann-1B_throughput.png) |[2,845](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/msturing-1B_throughput.png) |[3,265](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/msspacev-1B_throughput.png) |[1,789](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/text2image-1B_throughput.png) |[5,699](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/ssnpp-1B_throughput.png) | - -* A submission must support at least 3 databases to qualify for this ranking. -* The ranking is based on the score, which is the sum of benchmark improvements of qualifying databases (shown in specific database columns after the score column.) 
-* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - -#### Power Rankings - -|Rank|Submission |Team |Hardware|Status |Score |[Deep1B](#deep1B-power-rankings)|[BigANN](#bigann-power-rankings)|[MSTuring](#msturing-power-rankings)|[MSSpace](#msspace-power-rankings)|[Text2Image](#text2image-power-rankings)|[FBSSNet](#fbsimsearchnet-power-rankings)| -|----|------------------|-------|--------|-------|-----------|------|------|--------|-------|-----|-----| -| 1|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md)|NVidia|NVidia GPU |final|**-0.691**|[0.0024](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/deep-1B_power.png) |[0.0023](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/bigann-1B_power.png) |[0.0016](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/msturing-1B_power.png) |[0.0017](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/msspacev-1B_power.png) |[0.0094](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/text2image-1B_power.png)|-| -| 2|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md)|Intel|Intel Optane |final|**-0.648**|[0.0041](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/deep-1B_power.png) |[0.0022](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/bigann-1B_power.png) |[0.0048](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/msturing-1B_power.png) 
|[0.0050](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/msspacev-1B_power.png) |[0.0446](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/text2image-1B_power.png)|-| -| 3|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md)|NVidia|NVidia GPU |final|**-0.594**|[0.0002](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/deep-1B_power.png) |[0.0003](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/bigann-1B_power.png) |[0.0004](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/msturing-1B_power.png) |[0.0002](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/msspacev-1B_power.png) |-|-| -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md)|GSI Technology(*org*)|LedaE APU |final|**-0.513**|[0.0337](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/deep-1B_power.png) |[0.0341](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/bigann-1B_power.png) |[0.0236](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/msturing-1B_power.png) |[0.0230](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/msspacev-1B_power.png) |[0.1242](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/text2image-1B_power.png)|[0.0469](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/ssnpp-1B_power.png)| -| 5|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/diskann-bare-metal/README.md)|Facebook Research(*org*)|NVidia GPU 
|final|**baseline**|[0.1117](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/deep-1B_power.png) |[0.1576](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/bigann-1B_power.png) |[0.1743](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/msturing-1B_power.png) |[0.1520](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/msspacev-1B_power.png) |[0.1128](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/text2image-1B_power.png)|[0.0904](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/ssnpp-1B_power.png)| -| 6|[-](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md)|-|- |-|**-**|- |- |- |- |-|-| - -* A submission must support at least 3 databases to qualify for this ranking. -* The ranking is based on the score, which is the sum of benchmark improvements of qualifying databases (shown in specific database columns after the score column.) 
-* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - -#### Cost Rankings - -|Rank|Submission |Team |Hardware|Status |Score |[Deep1B](#deep1B-cost-rankings)|[BigANN](#bigann-cost-rankings)|[MSTuring](#msturing-cost-rankings)|[MSSpace](#msspace-cost-rankings)|[Text2Image](#text2image-cost-rankings)|[FBSSNet](#fbsimsearchnet-cost-rankings)| -|----|------------------|-------|--------|-------|-----------|------|------|--------|-------|----------|--------------| -| 1|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md)|Intel|Intel Optane |final|**$-3,978,172.56**|$16,086.82 |$15,439.92 |$16,347.45 |$16,409.08 |$103,599.49 |- | -| 2|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md)|NVidia|NVidia GPU |final|**$-2,339,919.09\*\***|$300,843.83 |$300,815.92 |$150,563.49 |$150,605.68 |$903,307.30 |- | -| 3|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md)|NVidia|NVidia GPU |final|**$-2,272,942.67\*\***|$150,082.04 |$150,088.58 |$150,127.39 |$150,078.78 |- |- | -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md)|GSI Technology(*org*)|LedaE APU |final|**$-907,570.13**|$569,058.09 |$569,210.35 |$286,911.87 |$398,163.18 |$1,213,773.56 |$629,442.91 | -| 5|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md)|Facebook Research(*org*)|NVidia GPU |final|**baseline**|$545,633.16 |$737,886.17 |$853,857.46 |$735,942.66 |$1,272,735.86 |$428,074.79 | -| 6|[-](-)|-|- |-|**-**|- |- |- |- |- |- | - -* A submission must support at least 3 databases to qualify for this ranking. 
-* The ranking is based on the score, which is the sum of benchmark improvements of qualifying databases (shown in specific database columns after the score column.) -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - -* \*\*Nvidia has not yet approved the MSRP cost used for ranking, so participation in this benchmark is still pending. - -### Rankings Per Database - -#### Deep1B - -##### Deep1B Recall Rankings - -|Rank|Submission |Team |Hardware |Status |R@10 | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|-----------| -| 1|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |final|**[0.99882](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/deep-1B_recall.png)**| -| 2|[diskann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/diskann-bare-metal/README.md) |Microsoft Research India(*org*) |Dell PowerEdge |final|**[0.99821](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/deep-1B_recall.png)**| -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |final|**[0.99541](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/deep-1B_recall.png)**| -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**[0.99208](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/deep-1B_recall.png)**| -| 5|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia 
GPU |final|**[0.95736](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/deep-1B_recall.png)**| -| 6|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**[0.94275](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/deep-1B_recall.png)**| - -* The operational point for ranking is 2000 QPS. We will use the highest recall for the search parameters that meet or exceed 2000 QPS. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - -##### Deep1B Throughput Rankings - -|Rank|Submission |Team |Hardware |Status |Q/S | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|-----------| -| 1|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |final|**[816,807](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/deep-1B_throughput.png)**| -| 2|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |final|**[196,546](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/deep-1B_throughput.png)**| -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |final|**[91,938](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/deep-1B_throughput.png)**| -| 4|[diskann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/diskann-bare-metal/README.md) |Microsoft Research India(*org*) |Dell PowerEdge 
|final|**[12,927](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/deep-1B_throughput.png)**| -| 5|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**[10,704](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/deep-1B_throughput.png)**| -| 6|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**[4,464](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/deep-1B_throughput.png)**| - -* The operational point for ranking is 0.90 recall@10. We will use the highest throughput for the search parameters that meet or exceed 0.90 recall@10. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - -##### Deep1B Power Rankings - -|Rank|Submission |Team |Hardware |Status |W*S/Q | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|-----------| -| 1|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |final|**[0.0002](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/deep-1B_power.png)**| -| 2|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |final|**[0.0024](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/deep-1B_power.png)**| -| 3|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane 
|final|**[0.0041](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/deep-1B_power.png)**| -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**[0.0337](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/deep-1B_power.png)**| -| 5|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**[0.1117](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/deep-1B_power.png)**| -| 6|[-](-) |- |- |-|**-**| - -* The operational point for ranking is 0.90 recall@10. We will use the lowest power consumption for the search parameters that meet or exceed 0.90 recall@10. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - -##### Deep1B Cost Rankings - -|Rank|Submission |Team |Hardware |Status |Cost |capex |opex |unit cost|units@100K qps|KwH*4yrs | -|----|--------------------|---------|-----------------------|--------|-------------|--------|--------|---------|--------------|---------| -| 1|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md)|Intel |Intel Optane |final|**$16,086.82** |$14,664.20|$1,422.62|$14,664.20 |1 |14,226.208| -| 2|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md)|NVidia |NVidia GPU |final|**$150,082.04\*\*** |$150,000.00|$82.04|$150,000.00 |1 |820.405| -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md)|NVidia |NVidia GPU |final|**$300,843.83\*\*** |$300,000.00|$843.83|$150,000.00 |2 |8,438.315| -| 
4|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md)|Facebook Research(*org*) |NVidia GPU |final|**$545,633.16** |$506,503.70|$39,129.46|$22,021.90 |23 |391,294.584| -| 5|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md)|GSI Technology(*org*) |LedaE APU |final|**$569,058.09** |$557,266.60|$11,791.49|$55,726.66 |10 |117,914.908| -| 6|[-](-)|- |- |-|**-** |-|-|- |- |-| - -* The operational point for ranking is 0.90 recall@10. We will use the lowest power consumption/query for the search parameters that meet or exceed 0.90 recall@10. -* The formula is based on: - * Take the algorithm's throughput submitted to leaderboard, use it to scale no. of systems needed to scale to 100K qps (using ceiling to round up any decimal.) - * Capex = cost per system * scale no. - * Take w*s/q from algorithm's power metric submitted to leaderboard and convert to KwH/q. - * Multiply by total queries at 100K qps for 4 years = 4x365x24x60x60x100000 total queries over 4 years. - * Opex = (total queries over 4 years) * KwH/query * $0.10/KwH -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress -* \*\*Nvidia has not yet approved the MSRP cost used for ranking, so participation in this benchmark is still pending. 
- -#### BigANN - -##### BigANN Recall Rankings - -|Rank|Submission |Team |Hardware |Status |R@10 | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|-------------| -| 1|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |final|**[0.99978](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/bigann-1B_recall.png)** | -| 2|[diskann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/diskann-bare-metal/README.md) |Microsoft Research India(*org*) |Dell PowerEdge |final|**[0.99976](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/bigann-1B_recall.png)** | -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |final|**[0.99882](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/bigann-1B_recall.png)** | -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**[0.99328](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/bigann-1B_recall.png)** | -| 5|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |final|**[0.96750](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/bigann-1B_recall.png)** | -| 6|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**[0.93260](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/bigann-1B_recall.png)** | - -* The operational point for ranking is 2000 QPS. 
We will use the highest recall for the search parameters that meet or exceed 2000 QPS. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - -##### BigANN Throughput Rankings - -|Rank|Submission |Team |Hardware |Status |Q/S | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|-------------| -| 1|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |final|**[767,653](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/bigann-1B_throughput.png)** | -| 2|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |final|**[335,991](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/bigann-1B_throughput.png)** | -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |final|**[85,446](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/bigann-1B_throughput.png)** | -| 4|[diskann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/diskann-bare-metal/README.md) |Microsoft Research India(*org*) |Dell PowerEdge |final|**[19,094](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/bigann-1B_throughput.png)** | -| 5|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**[10,672](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/bigann-1B_throughput.png)** | -| 
6|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**[3,271](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/bigann-1B_throughput.png)** | - -* The operational point for ranking is 0.90 recall@10. We will use the highest throughput for the search parameters that meet or exceed 0.90 recall@10. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - -##### BigANN Power Rankings - -|Rank|Submission |Team |Hardware |Status |W*S/Q | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|-----------| -| 1|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |final|**[0.0003](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/bigann-1B_power.png)**| -| 2|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |final|**[0.0022](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/bigann-1B_power.png)**| -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |final|**[0.0023](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/bigann-1B_power.png)**| -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**[0.0341](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/bigann-1B_power.png)**| -| 
5|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**[0.1576](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/bigann-1B_power.png)**| -| 6|[-](-) |- |- |-|**-**| - -* The operational point for ranking is 0.90 recall@10. We will use the lowest power consumption for the search parameters that meet or exceed 0.90 recall@10. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - -##### BigANN Cost Rankings - -|Rank|Submission |Team |Hardware |Status |Cost |capex |opex |unit cost|units@100K qps|KwH*4yrs | -|----|--------------------|------------------------------|--------------------|--------|--------------|--------|--------|---------|--------------|---------| -| 1|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md)|Intel |Intel Optane |final|**$15,439.92** |$14,664.20|$775.72|$14,664.20 |1 |7,757.221| -| 2|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md)|NVidia |NVidia GPU |final|**$150,088.58\*\*** |$150,000.00|$88.58|$150,000.00 |1 |885.770| -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md)|NVidia |NVidia GPU |final|**$300,815.92\*\*** |$300,000.00|$815.92|$150,000.00 |2 |8,159.226| -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md)|GSI Technology(*org*) |LedaE APU |final|**$569,210.35** |$557,266.60|$11,943.75|$55,726.66 |10 |119,437.537| -| 5|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md)|Facebook Research(*org*) |NVidia GPU |final|**$737,886.17** |$682,678.90|$55,207.27|$22,021.90 |31 |552,072.703| -| 
6|[-](-)|- |- |-|**-** |-|-|- |- |-| - -* The operational point for ranking is 0.90 recall@10. We will use the lowest power consumption/query for the search parameters that meet or exceed 0.90 recall@10. -* The formula is based on: - * Take the algorithm's throughput submitted to leaderboard, use it to scale no. of systems needed to scale to 100K qps (using ceiling to round up any decimal.) - * Capex = cost per system * scale no. - * Take w*s/q from algorithm's power metric submitted to leaderboard and convert to KwH/q. - * Multiply by total queries at 100K qps for 4 years = 4x365x24x60x60x100000 total queries over 4 years. - * Opex = (total queries over 4 years) * KwH/query * $0.10/KwH -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress -* \*\*Nvidia has not yet approved the MSRP cost used for ranking, so participation in this benchmark is still pending. 
- -#### MSTuring - -##### MSTuring Recall Rankings - -|Rank|Submission |Team |Hardware |Status |R@10 | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|---------------| -| 1|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |final|**[0.99568](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/msturing-1B_recall.png)** | -| 2|[diskann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/diskann-bare-metal/README.md) |Microsoft Research India(*org*) |Dell PowerEdge |final|**[0.99444](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/msturing-1B_recall.png)** | -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |final|**[0.98993](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/msturing-1B_recall.png)** | -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**[0.97841](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/msturing-1B_recall.png)** | -| 5|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |final|**[0.96286](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/msturing-1B_recall.png)** | -| 6|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**[0.91322](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/msturing-1B_recall.png)** | - -* The operational point for ranking is 2000 QPS. 
We will use the highest recall for the search parameters that meet or exceed 2000 QPS. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - -##### MSTuring Throughput Rankings - -|Rank|Submission |Team |Hardware |Status |Q/S | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|------------| -| 1|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |final|**[586,722](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/msturing-1B_throughput.png)** | -| 2|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |final|**[161,463](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/msturing-1B_throughput.png)** | -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |final|**[110,830](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/msturing-1B_throughput.png)** | -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**[21,780](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/msturing-1B_throughput.png)** | -| 5|[diskann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/diskann-bare-metal/README.md) |Microsoft Research India(*org*) |Dell PowerEdge |final|**[17,201](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/msturing-1B_throughput.png)** | -| 
6|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**[2,845](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/msturing-1B_throughput.png)** | - -* The operational point for ranking is 0.90 recall@10. We will use the highest throughput for the search parameters that meet or exceed 0.90 recall@10. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - -##### MSTuring Power Rankings - -|Rank|Submission |Team |Hardware |Status|W*S/Q | -|----|-------------------------------------------------------|------------------------------|-----------------------|------|--------------| -| 1|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |final|**[0.0004](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/msturing-1B_power.png)** | -| 2|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |final|**[0.0016](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/msturing-1B_power.png)** | -| 3|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |final|**[0.0048](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/msturing-1B_power.png)** | -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**[0.0236](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/msturing-1B_power.png)** | -| 
5|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**[0.1743](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/msturing-1B_power.png)** | -| 6|[-](-) |- |- |-|**-** | - -* The operational point for ranking is 0.90 recall@10. We will use the lowest power consumption for the search parameters that meet or exceed 0.90 recall@10. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - -##### MSTuring Cost Rankings - -|Rank|Submission |Team |Hardware |Status |Cost |capex |opex |unit cost|units@100K qps|KwH*4yrs | -|----|------------------------------------|------------------------------|-----------------------|--------|--------------|--------|--------|---------|--------------|----------| -| 1|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |final|**$16,347.45** |$14,664.20|$1,683.25|$14,664.20 |1 |16,832.451 | -| 2|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |final|**$150,127.39\*\*** |$150,000.00|$127.39|$150,000.00 |1 |1,273.870 | -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |final|**$150,563.49\*\*** |$150,000.00|$563.49|$150,000.00 |1 |5,634.885 | -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**$286,911.87** |$278,633.30|$8,278.57|$55,726.66 |5 |82,785.683 | -| 5|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**$853,857.46** 
|$792,788.40|$61,069.06|$22,021.90 |36 |610,690.611 | -| 6|[-](-) |- |- |-|**-** |-|-|- |- |- | - -* The operational point for ranking is 0.90 recall@10. We will use the lowest power consumption/query for the search parameters that meet or exceed 0.90 recall@10. -* The formula is based on: - * Take the algorithm's throughput submitted to leaderboard, use it to scale no. of systems needed to scale to 100K qps (using ceiling to round up any decimal.) - * Capex = cost per system * scale no. - * Take w*s/q from algorithm's power metric submitted to leaderboard and convert to KwH/q. - * Multiply by total queries at 100K qps for 4 years = 4x365x24x60x60x100000 total queries over 4 years. - * Opex = (total queries over 4 years) * KwH/query * $0.10/KwH -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress -* \*\*Nvidia has not yet approved the MSRP cost used for ranking, so participation in this benchmark is still pending. 
- -#### MSSpace - -##### MSSpace Recall Rankings - -|Rank|Submission |Team |Hardware |Status |R@10 | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|---------| -| 1|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |final|**[0.99835](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/msspacev-1B_recall.png)** | -| 2|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |final|**[0.99428](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/msspacev-1B_recall.png)** | -| 3|[diskann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/diskann-bare-metal/README.md) |Microsoft Research India(*org*) |Dell PowerEdge |final|**[0.99342](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/msspacev-1B_recall.png)** | -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**[0.98622](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/msspacev-1B_recall.png)** | -| 5|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |final|**[0.97541](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/msspacev-1B_recall.png)** | -| 6|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**[0.90853](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/msspacev-1B_recall.png)** | - -* The operational point for ranking is 2000 QPS. 
We will use the highest recall for the search parameters that meet or exceed 2000 QPS. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - -##### MSSpace Throughput Rankings - -|Rank|Submission |Team |Hardware |Status |Q/S | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|------------| -| 1|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |final|**[844,287](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/msspacev-1B_throughput.png)** | -| 2|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |final|**[155,899](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/msspacev-1B_throughput.png)** | -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |final|**[109,621](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/msspacev-1B_throughput.png)** | -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**[16,422](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/msspacev-1B_throughput.png)** | -| 5|[diskann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/diskann-bare-metal/README.md) |Microsoft Research India(*org*) |Dell PowerEdge |final|**[6,503](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/msspacev-1B_throughput.png)** | -| 
6|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**[3,265](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/msspacev-1B_throughput.png)** | - -* The operational point for ranking is 0.9 recall@10. We will use the highest throughput for the search parameters that meet or exceed 0.9 recall@10. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - -##### MSSpace Power Rankings - -|Rank|Submission |Team |Hardware |Status |W*S/Q | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|------------| -| 1|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |final|**[0.0002](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/msspacev-1B_power.png)** | -| 2|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |final|**[0.0017](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/msspacev-1B_power.png)** | -| 3|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |final|**[0.0050](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/msspacev-1B_power.png)** | -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**[0.0230](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/msspacev-1B_power.png)** | -| 
5|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**[0.1520](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/msspacev-1B_power.png)** | -| 6|[-](-) |- |- |-|**-** | - -* The operational point for ranking is 0.9 recall@10. We will use the lowest power consumption for the search parameters that meet or exceed 0.9 recall@10. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - -##### MSSpace Cost Rankings - -|Rank|Submission |Team |Hardware |Status |Cost |capex |opex |unit cost|units@100K qps|KwH*4yrs | -|----|--------------------|------------------------------|-----------------------|------- |--------------|--------|--------|---------|--------------|----------| -| 1|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md)|Intel |Intel Optane |final|**$16,409.08** |$14,664.20|$1,744.88|$14,664.20 |1 |17,448.764 | -| 2|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md)|NVidia |NVidia GPU |final|**$150,078.78\*\*** |$150,000.00|$78.78|$150,000.00 |1 |787.774 | -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md)|NVidia |NVidia GPU |final|**$150,605.68\*\*** |$150,000.00|$605.68|$150,000.00 |1 |6,056.841 | -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md)|GSI Technology(*org*) |LedaE APU |final|**$398,163.18** |$390,086.62|$8,076.56|$55,726.66 |7 |80,765.638 | -| 5|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md)|Facebook Research(*org*) |NVidia GPU |final|**$735,942.66** |$682,678.90|$53,263.76|$22,021.90 |31 
|532,637.584 | -| 6|[-](-)|- |- |-|**-** |-|-|- |- |- | - -* The operational point for ranking is 0.90 recall@10. We will use the lowest power consumption/query for the search parameters that meet or exceed 0.90 recall@10. -* The formula is based on: - * Take the algorithm's throughput submitted to leaderboard, use it to scale no. of systems needed to scale to 100K qps (using ceiling to round up any decimal.) - * Capex = cost per system * scale no. - * Take w*s/q from algorithm's power metric submitted to leaderboard and convert to KwH/q. - * Multiply by total queries at 100K qps for 4 years = 4x365x24x60x60x100000 total queries over 4 years. - * Opex = (total queries over 4 years) * KwH/query * $0.10/KwH -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress -* \*\*Nvidia has not yet approved the MSRP cost used for ranking, so participation in this benchmark is still pending. 
- -#### Text2Image - -##### Text2Image Recall Rankings - -|Rank|Submission |Team |Hardware |Status |R@10 | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|-------------| -| 1|[diskann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/diskann-bare-metal/README.md) |Microsoft Research India(*org*) |Dell PowerEdge |final|**[0.98130](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/text2image-1B_recall.png)** | -| 2|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |final|**[0.97340](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/text2image-1B_recall.png)** | -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |final|**[0.94691](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/text2image-1B_recall.png)** | -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**[0.92855](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/text2image-1B_recall.png)** | -| 5|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**[0.86028](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/text2image-1B_recall.png)** | -| 6|[-](-) |- |- |-|**-** | - -* The operational point for ranking is 2000 QPS. We will use the highest recall for the search parameters that meet or exceed 2000 QPS. 
-* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - -##### Text2Image Throughput Rankings - -|Rank|Submission |Team |Hardware |Status |Q/S | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|------------| -| 1|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |final|**[19,340](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/text2image-1B_throughput.png)** | -| 2|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |final|**[17,063](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/text2image-1B_throughput.png)** | -| 3|[diskann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/diskann-bare-metal/README.md) |Microsoft Research India(*org*) |Dell PowerEdge |final|**[9,307](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/text2image-1B_throughput.png)** | -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**[4,838](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/text2image-1B_throughput.png)** | -| 5|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**[1,789](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/text2image-1B_throughput.png)** | -| 6|[-](-) |- |- |-|**-** | - -* The operational point for ranking is 0.860 recall@10. 
We will use the highest throughput for the search parameters that meet or exceed 0.860 recall@10. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - -##### Text2Image Power Rankings - -|Rank|Submission |Team |Hardware |Status |W*S/Q | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|-----------| -| 1|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |final|**[0.0094](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/text2image-1B_power.png)**| -| 2|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |final|**[0.0446](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/text2image-1B_power.png)**| -| 3|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**[0.1128](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/text2image-1B_power.png)**| -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**[0.1242](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/text2image-1B_power.png)**| -| 5|[-](-) |- |- |-|**-**| -| 6|[-](-) |- |- |-|**-**| - -* The operational point for ranking is 0.86 recall@10. We will use the lowest power consumption for the search parameters that meet or exceed 0.86 recall@10. 
-* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - -##### Text2Image Cost Rankings - -|Rank|Submission |Team |Hardware |Status |Cost |capex |opex |unit cost|units@100K qps|KwH*4yrs | -|----|---------------------|------------------------------|---------------------|--------|--------------|--------|--------|---------|--------------|---------| -| 1|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |final|**$103,599.49** |$87,985.20|$15,614.29|$14,664.20 |6 |156,142.873| -| 2|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |final|**$903,307.30\*\*** |$900,000.00|$3,307.30|$150,000.00 |6 |33,072.963| -| 3|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**$1,213,773.56** |$1,170,259.86|$43,513.70|$55,726.66 |21 |435,137.010| -| 4|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**$1,272,735.86** |$1,233,226.40|$39,509.46|$22,021.90 |56 |395,094.625| -| 5|[-](-) |- |- |-|**-** |-|-|- |- |-| -| 6|[-](-) |- |- |-|**-** |-|-|- |- |-| - -* The operational point for ranking is 0.86 recall@10. We will use the lowest power consumption/query for the search parameters that meet or exceed 0.86 recall@10. -* The formula is based on: - * Take the algorithm's throughput submitted to leaderboard, use it to scale no. of systems needed to scale to 100K qps (using ceiling to round up any decimal.) - * Capex = cost per system * scale no. - * Take w*s/q from algorithm's power metric submitted to leaderboard and convert to KwH/q. 
- * Multiply by total queries at 100K qps for 4 years = 4x365x24x60x60x100000 total queries over 4 years. - * Opex = (total queries over 4 years) * KwH/query * $0.10/KwH -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress -* \*\*Nvidia has not yet approved the MSRP cost used for ranking, so participation in this benchmark is still pending. - -#### FBSimSearchNet - -##### FBSimSearchNet AP Rankings - -|Rank|Submission |Team |Hardware |Status |AP | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|-------------| -| 1|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**[0.99684](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/ssnpp-1B_recall.png)** | -| 2|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**[0.97863](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/ssnpp-1B_recall.png)** | -| 3|[-](-) |- |- |-|**-** | -| 4|[-](-) |- |- |-|**-** | -| 5|[-](-) |- |- |-|**-** | -| 6|[-](-) |- |- |-|**-** | - -* The operational point for ranking is 2000 QPS. We will use the highest recall for the search parameters that meet or exceed 2000 QPS. 
-* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - -##### FBSimSearchNet Throughput Rankings - -|Rank|Submission |Team |Hardware |Status |Q/S | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|------------| -| 1|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**[9,345](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/ssnpp-1B_throughput.png)** | -| 2|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**[5,699](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/ssnpp-1B_throughput.png)** | -| 3|[-](-) |- |- |-|**-** | -| 4|[-](-) |- |- |-|**-** | -| 5|[-](-) |- |- |-|**-** | -| 6|[-](-) |- |- |-|**-** | - -* The operational point for ranking is 0.9 recall@10. We will use the highest throughput for the search parameters that meet or exceed 0.9 average precision. 
-* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - - -##### FBSimSearchNet Power Rankings - -|Rank|Submission |Team |Hardware |Status |W*S/Q | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|-----------| -| 1|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**[0.0469](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/ssnpp-1B_power.png)**| -| 2|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**[0.0904](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/ssnpp-1B_power.png)**| -| 3|[-](-) |- |- |-|**-**| -| 4|[-](-) |- |- |-|**-**| -| 5|[-](-) |- |- |-|**-**| -| 6|[-](-) |- |- |-|**-**| - -* The operational point for ranking is 0.9 recall@10. We will use the lowest power consumption for the search parameters that meet or exceed 0.9 average precision. 
-* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - -##### FBSimSearchNet Cost Rankings - -|Rank|Submission |Team |Hardware |Status |Cost |capex |opex |unit cost|units@100K qps|KwH*4yrs | -|----|--------------------|------------------------------|---------------------|--------|--------------|--------|--------|---------|--------------|---------| -| 1|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md)|Facebook Research(*org*) |NVidia GPU |final|**$428,074.79** |$396,394.20|$31,680.59|$22,021.90 |18 |316,805.859| -| 2|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md)|GSI Technology(*org*) |LedaE APU |final|**$629,442.91** |$612,993.26|$16,449.65|$55,726.66 |11 |164,496.451| -| 3|[-](-)|- |- |-|**-** | -| -| -| -| -| -| 4|[-](-)|- |- |-|**-** | -| -| -| -| -| - -* The operational point for ranking is 0.9 recall@10. We will use the lowest power consumption/query for the search parameters that meet or exceed 0.9 recall@10. -* The formula is based on: - * Take the algorithm's throughput submitted to leaderboard, use it to scale no. of systems needed to scale to 100K qps (using ceiling to round up any decimal.) - * Capex = cost per system * scale no. - * Take w*s/q from algorithm's power metric submitted to leaderboard and convert to KwH/q. - * Multiply by total queries at 100K qps for 4 years = 4x365x24x60x60x100000 total queries over 4 years. - * Opex = (total queries over 4 years) * KwH/query * $0.10/KwH -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress -* \*\*Nvidia has not yet approved the MSRP cost used for ranking, so participation in this benchmark is still pending. 
diff --git a/t3/LB_history/Nov.29.2021/LEADERBOARDS.md b/t3/LB_history/Nov.29.2021/LEADERBOARDS.md deleted file mode 100644 index ec4cc12f8..000000000 --- a/t3/LB_history/Nov.29.2021/LEADERBOARDS.md +++ /dev/null @@ -1,680 +0,0 @@ -# T3 Track Leaderboards (Unofficial) - -Please note that all rankings are currently unofficial due to the following reasons: -* We continue to take changes to algorithms and indexes until Dec 1, so scores and rankings are still subject to change. -* All [open tasks and issues](TASKS_ISSUES_RESOLUTIONS.md) must be resolved. - -## Final Rankings On Private Query Set - -*Not yet available* - -## Rankings On Public Query Set - -### Rankings By Submission Name (alphabetical) - -|Submission |Team |Hardware |Status |Evaluator|Algo |Runs |[Recall Rank](#recall-or-ap-rankings)|[Thru-put Rank](#throughput-rankings)|[Power Rank](#power-rankings)|[Cost Rank](#cost-rankings)| -|--------------------|-----------|----------|-------|---------|---------|--------|---------|--------------|-----------------------------|---------------------------| -|deepgram |DeepGram |NVidia GPU|final | -| -| -| *NQ*| *NQ*| *NQ*| *NQ*| -|[diskann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/diskann-bare-metal/README.md) |Microsoft Research(*org*) |Dell PowerEdge |inprog |Harsha Simhadri |[src](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/benchmark/algorithms/diskann-t2.py) |[nb](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/EvalPublic.ipynb) |[1](#recall-or-ap-rankings) |[4](#throughput-rankings) |*NQ* |*NQ* | -|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final |George Williams |[src](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/benchmark/algorithms/faiss_t3.py) 
|[nb](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/EvalPublic.ipynb) |[6](#recall-or-ap-rankings) |[6](#throughput-rankings) |[5](#power-rankings) |[2](#cost-rankings) | -|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |inprog |George Williams |[src](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/benchmark/algorithms/gemini.py) |[nb](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/EvalPublic.ipynb) |[3](#recall-or-ap-rankings) |[5](#throughput-rankings) |[4](#power-rankings) |[3](#cost-rankings) | -|kanndi |Silo.ai |LedaE APU |inprog | -| -| -| -| -| -| -| -|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |inprog |George Williams |[src](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/benchmark/algorithms/cuanns_ivfpq.py) |[nb](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/EvalPublic.ipynb) |[2](#recall-or-ap-rankings) |[3](#throughput-rankings) |[1](#power-rankings) |*NQ* | -|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |inprog |George Williams |[src](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/benchmark/algorithms/cuanns_multigpu.py) |[nb](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/EvalPublic.ipynb) |[5](#recall-or-ap-rankings) |[1](#throughput-rankings) |[3](#power-rankings) |*NQ* | -|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md)|Intel |Intel Optane |inprog|George Williams |[src](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/benchmark/algorithms/graphann.py) 
|[nb](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/EvalPublic.ipynb)|[4](#recall-or-ap-rankings) |[2](#throughput-rankings) |[2](#power-rankings) |[1](#cost-rankings) | -|optanne_graphann_2 |Intel |Intel Optane |inprog | -| -| -| -| -| -| -| -|vector_t3 |Vector Inst|NVidia GPU|final | -| -| -| *NQ*| *NQ*| *NQ*| *NQ*| - -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - * *NQ* = not qualified - -### Rankings Per Metric - -#### Recall Or AP Rankings - -|Rank|Submission |Team |Hardware|Status |Score |[Deep1B](#deep1B-recall-rankings)|[BigANN](#bigann-recall-rankings)|[MSTuring](#msturing-recall-rankings)|[MSSpace](#msspace-recall-rankings)|[Text2Image](#text2image-recall-rankings)|[FBSSNet](#fbsimsearchnet-ap-rankings)| -|----|------------------|-------|--------|-------|-----------|------|------|--------|-------|----------|-------| -| 1|[diskann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/diskann-bare-metal/README.md)|Microsoft Research(*org*)|Dell PowerEdge |inprog|**0.420**|[0.99821](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/deep-1B_recall.png) |[0.99976](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/bigann-1B_recall.png) |[0.99444](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/msturing-1B_recall.png) |[0.99342](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/msspacev-1B_recall.png) |[0.98130](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/text2image-1B_recall.png) |- | -| 
2|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md)|NVidia|NVidia GPU |inprog|**0.373**|[0.99542](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/deep-1B_recall.png) |[0.99882](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/bigann-1B_recall.png) |[0.98993](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/msturing-1B_recall.png) |[0.99428](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/msspacev-1B_recall.png) |[0.94136](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/text2image-1B_recall.png) |- | -| 3|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md)|GSI Technology(*org*)|LedaE APU |inprog|**0.296**|[0.98871](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/deep-1B_recall.png) |[0.99253](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/bigann-1B_recall.png) |[0.97841](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/msturing-1B_recall.png) |[0.98622](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/msspacev-1B_recall.png) |[0.88585](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/text2image-1B_recall.png) |[0.99053](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/ssnpp-1B_recall.png) | -| 4|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md)|Intel|Intel Optane |inprog|**0.279**|[0.98264](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/deep-1B_recall.png) 
|[0.99084](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/bigann-1B_recall.png) |[0.96218](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/msturing-1B_recall.png) |[0.98791](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/msspacev-1B_recall.png) |[0.90277](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/text2image-1B_recall.png) |- | -| 5|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md)|NVidia|NVidia GPU |inprog|**0.278**|[0.99504](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/deep-1B_recall.png) |[0.99815](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/bigann-1B_recall.png) |[0.98399](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/msturing-1B_recall.png) |[0.98785](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/msspacev-1B_recall.png) |- |- | -| 6|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md)|Facebook Research(*org*)|NVidia GPU |final|**baseline**|[0.94275](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/deep-1B_recall.png) |[0.92671](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/bigann-1B_recall.png) |[0.90900](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/msturing-1B_recall.png) |[0.90853](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/msspacev-1B_recall.png) |[0.86028](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/text2image-1B_recall.png) 
|[0.97863](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/ssnpp-1B_recall.png) | -| 7| -| -| -| -| -| -| -| -| -| -| -| -| 8| -| -| -| -| -| -| -| -| -| -| -| -| 9| -| -| -| -| -| -| -| -| -| -| -| -| 10| -| -| -| -| -| -| -| -| -| -| -| - -* A submission must support at least 3 databases to qualify for this ranking. -* The ranking is based on the score, which is the sum of benchmark improvements of qualifying databases (shown in specific database columns after the score column.) -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - -#### Throughput Rankings - -|Rank|Submission |Team |Hardware|Status |Score |[Deep1B](#deep1B-throughput-rankings)|[BigANN](#bigann-throughput-rankings)|[MSTuring](#msturing-throughput-rankings)|[MSSpace](#msspace-throughput-rankings)|[Text2Image](#text2image-throughput-rankings)|[FBSSNet](#fbsimsearchnet-throughput-rankings)| -|----|------------------|-------|--------|-------|-----------|------|------|--------|-------|----------|--------------| -| 1|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md)|NVidia|NVidia GPU |inprog|**2983752.533**|[805,064.205](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/deep-1B_throughput.png) |[771,493.948](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/bigann-1B_throughput.png) |[578,677.940](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/msturing-1B_throughput.png) |[841,150.465](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/msspacev-1B_throughput.png) |- |- | -| 
2|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md)|Intel|Intel Optane |inprog|**821550.201**|[184,490.708](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/deep-1B_throughput.png) |[343,727.791](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/bigann-1B_throughput.png) |[157,277.710](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/msturing-1B_throughput.png) |[139,612.021](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/msspacev-1B_throughput.png) |[10,838.358](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/text2image-1B_throughput.png) |- | -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md)|NVidia|NVidia GPU |inprog|**397623.802**|[97,268.471](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/deep-1B_throughput.png) |[84,367.141](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/bigann-1B_throughput.png) |[111,580.136](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/msturing-1B_throughput.png) |[109,555.059](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/msspacev-1B_throughput.png) |[9,249.383](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/text2image-1B_throughput.png) |- | -| 4|[diskann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/diskann-bare-metal/README.md)|Microsoft Research(*org*)|Dell PowerEdge |inprog|**50635.296**|[12,926.890](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/deep-1B_throughput.png) 
|[19,094.371](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/bigann-1B_throughput.png) |[17,200.601](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/msturing-1B_throughput.png) |[6,503.212](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/msspacev-1B_throughput.png) |[9,306.610](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/text2image-1B_throughput.png) |- | -| 5|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md)|GSI Technology(*org*)|LedaE APU |inprog|**37428.363**|[9,150.271](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/deep-1B_throughput.png) |[9,504.865](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/bigann-1B_throughput.png) |[20,166.678](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/msturing-1B_throughput.png) |[8,587.024](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/msspacev-1B_throughput.png) |[1,864.634](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/text2image-1B_throughput.png) |[8,123.552](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/ssnpp-1B_throughput.png) | -| 6|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md)|Facebook Research(*org*)|NVidia GPU |final|**baseline**|[4,417.036](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/deep-1B_throughput.png) |[3,086.656](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/bigann-1B_throughput.png) 
|[2,359.485](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/msturing-1B_throughput.png) |[2,770.848](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/msspacev-1B_throughput.png) |[1,762.363](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/text2image-1B_throughput.png) |[5,572.272](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/ssnpp-1B_throughput.png) | -| 7| -| -| -| -| -| -| -| -| -| -| -| -| 8| -| -| -| -| -| -| -| -| -| -| -| -| 9| -| -| -| -| -| -| -| -| -| -| -| -| 10| -| -| -| -| -| -| -| -| -| -| -| - -* A submission must support at least 3 databases to qualify for this ranking. -* The ranking is based on the score, which is the sum of benchmark improvements of qualifying databases (shown in specific database columns after the score column.) -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - -#### Power Rankings - -|Rank|Submission |Team |Hardware|Status |Score |[Deep1B](#deep1B-power-rankings)|[BigANN](#bigann-power-rankings)|[MSTuring](#msturing-power-rankings)|[MSSpace](#msspace-power-rankings)|[Text2Image](#text2image-power-rankings)|[FBSSNet](#fbsimsearchnet-power-rankings)| -|----|------------------|-------|--------|-------|-----------|------|------|--------|-------|-----|-----| -| 1|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md)|NVidia|NVidia GPU |inprog|**-0.744**|[0.0023](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/deep-1B_power.png) |[0.0024](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/bigann-1B_power.png) 
|[0.0017](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/msturing-1B_power.png) |[0.0017](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/msspacev-1B_power.png) |[0.0222](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/text2image-1B_power.png)|-| -| 2|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md)|Intel|Intel Optane |inprog|**-0.687**|[0.0040](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/deep-1B_power.png) |[0.0021](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/bigann-1B_power.png) |[0.0049](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/msturing-1B_power.png) |[0.0054](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/msspacev-1B_power.png) |[0.0702](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/text2image-1B_power.png)|-| -| 3|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md)|NVidia|NVidia GPU |inprog|**-0.650**|[0.0002](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/deep-1B_power.png) |[0.0002](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/bigann-1B_power.png) |[0.0004](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/msturing-1B_power.png) |[0.0002](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/msspacev-1B_power.png) |-|-| -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/diskann-bare-metal/README.md)|GSI Technology(*org*)|LedaE APU 
|inprog|**-0.489**|[0.0398](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/deep-1B_power.png) |[0.0394](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/bigann-1B_power.png) |[0.0227](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/msturing-1B_power.png) |[0.0485](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/msspacev-1B_power.png) |[0.1759](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/text2image-1B_power.png)|[0.0540](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/ssnpp-1B_power.png)| -| 5|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md)|Facebook Research(*org*)|NVidia GPU |final|**baseline**|[0.1126](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/deep-1B_power.png) |[0.1671](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/bigann-1B_power.png) |[0.2037](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/msturing-1B_power.png) |[0.1674](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/msspacev-1B_power.png) |[0.1233](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/text2image-1B_power.png)|[0.0949](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/ssnpp-1B_power.png)| -| 6|[-](-)|-|- |-|**-**|- |- |- |- |-|-| -| 7| -| -| -| -| -| -| -| -| -| -| -| -| 8| -| -| -| -| -| -| -| -| -| -| -| -| 9| -| -| -| -| -| -| -| -| -| -| -| -| 10| -| -| -| -| -| -| -| -| -| -| -| - -* A submission must support at least 3 databases to qualify for this ranking. 
-* The ranking is based on the score, which is the sum of benchmark improvements of qualifying databases (shown in specific database columns after the score column.) -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - -#### Cost Rankings - -|Rank|Submission |Team |Hardware|Status |Score |[Deep1B](#deep1B-cost-rankings)|[BigANN](#bigann-cost-rankings)|[MSTuring](#msturing-cost-rankings)|[MSSpace](#msspace-cost-rankings)|[Text2Image](#text2image-cost-rankings)|[FBSSNet](#fbsimsearchnet-cost-rankings)| -|----|------------------|-------|--------|-------|-----------|------|------|--------|-------|----------|--------------| -| 1|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md)|Intel|Intel Optane |inprog|**$-4,285,768.44**|$16,082.49 |$15,407.15 |$16,397.80 |$16,563.61 |$171,244.96 |- | -| 2|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md)|Facebook Research(*org*)|NVidia GPU |final|**baseline**|$545,952.10 |$785,282.45 |$1,018,332.30 |$873,460.84 |$1,298,436.77 |$429,634.84 | -| 3|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md)|GSI Technology(*org*)|LedaE APU |inprog|**$1,089,170.96**|$626,932.94 |$626,785.91 |$286,578.81 |$685,704.76 |$3,070,882.16 |$743,385.69 | -| 4|[-](-)|-|- |-|**-**|- |- |- |- |- |- | -| 5|[-](-)|-|- |-|**-**|- |- |- |- |- |- | -| 6|[-](-)|-|- |-|**-**|- |- |- |- |- |- | -| 7| -| -| -| -| -| -| -| -| -| -| -| -| 8| -| -| -| -| -| -| -| -| -| -| -| -| 9| -| -| -| -| -| -| -| -| -| -| -| -| 10| -| -| -| -| -| -| -| -| -| -| -| - -* A submission must support at least 3 databases to qualify for this ranking. 
-* The ranking is based on the score, which is the sum of benchmark improvements of qualifying databases (shown in specific database columns after the score column.) -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - -### Rankings Per Database - -#### Deep1B - -##### Deep1B Recall Rankings - -|Rank|Submission |Team |Hardware |Status |R@10 | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|-----------| -| 1|[diskann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/diskann-bare-metal/README.md) |Microsoft Research(*org*) |Dell PowerEdge |inprog|**[0.99821](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/deep-1B_recall.png)**| -| 2|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |inprog|**[0.99542](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/deep-1B_recall.png)**| -| 3|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |inprog|**[0.99504](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/deep-1B_recall.png)**| -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |inprog|**[0.98871](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/deep-1B_recall.png)**| -| 5|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane 
|inprog|**[0.98264](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/deep-1B_recall.png)**| -| 6|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**[0.94275](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/deep-1B_recall.png)**| -| 7| -| -| -| -| -| -| 8| -| -| -| -| -| -| 9| -| -| -| -| -| -| 10| -| -| -| -| -| - -* The operational point for ranking is 2000 QPS. We will use the highest recall for the search parameters that meet or exceed 2000 QPS. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - -##### Deep1B Throughput Rankings - -|Rank|Submission |Team |Hardware |Status |Q/S | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|-----------| -| 1|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |inprog|**[805,064.205](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/deep-1B_throughput.png)**| -| 2|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |inprog|**[184,490.708](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/deep-1B_throughput.png)**| -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |inprog|**[97,268.471](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/deep-1B_throughput.png)**| -| 
4|[diskann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/diskann-bare-metal/README.md) |Microsoft Research(*org*) |Dell PowerEdge |inprog|**[12,926.890](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/deep-1B_throughput.png)**| -| 5|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |inprog|**[9,150.271](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/deep-1B_throughput.png)**| -| 6|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**[4,417.036](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/deep-1B_throughput.png)**| -| 7| -| -| -| -| -| -| 8| -| -| -| -| -| -| 9| -| -| -| -| -| -| 10| -| -| -| -| -| - -* The operational point for ranking is 0.90 recall@10. We will use the highest throughput for the search parameters that meet or exceed 0.90 recall@10. 
-* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - -##### Deep1B Power Rankings - -|Rank|Submission |Team |Hardware |Status |W*S/Q | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|-----------| -| 1|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |inprog|**[0.0002](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/deep-1B_power.png)**| -| 2|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |inprog|**[0.0023](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/deep-1B_power.png)**| -| 3|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |inprog|**[0.0040](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/deep-1B_power.png)**| -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |inprog|**[0.0398](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/deep-1B_power.png)**| -| 5|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**[0.1126](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/deep-1B_power.png)**| -| 6|[-](-) |- |- |-|**-**| -| 7| -| -| -| -| -| -| 8| -| -| -| -| -| -| 9| -| -| -| -| -| -| 10| -| -| -| -| -| - -* The operational point for ranking is 0.90 recall@10. 
We will use the lowest power consumption for the search parameters that meet or exceed 0.90 recall@10. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - -##### Deep1B Cost Rankings - -|Rank|Submission |Team |Hardware |Status |Cost |capex |opex |unit cost|units@100K qps|KwH*4yrs | -|----|--------------------|---------|-----------------------|--------|-------------|--------|--------|---------|--------------|---------| -| 1|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md)|Intel |Intel Optane |inprog|**$16,082.49** |$14,664.20|$1,418.29|$14,664.20 |1 |14,182.933| -| 2|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md)|Facebook Research(*org*) |NVidia GPU |final|**$545,952.10** |$506,503.70|$39,448.40|$22,021.90 |23 |394,484.028| -| 3|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md)|GSI Technology(*org*) |LedaE APU |inprog|**$626,932.94** |$612,993.26|$13,939.68|$55,726.66 |11 |139,396.812| -| 4|[-](-)|- |- |-|**-** |-|-|- |- |-| -| 5|[-](-)|- |- |-|**-** |-|-|- |- |-| -| 6|[-](-)|- |- |-|**-** |-|-|- |- |-| -| 7| -| -| -| -| -| -| -| -| -| -| -| 8| -| -| -| -| -| -| -| -| -| -| -| 9| -| -| -| -| -| -| -| -| -| -| -| 10| -| -| -| -| -| -| -| -| -| -| - -* The operational point for ranking is 0.90 recall@10. We will use the lowest power consumption/query for the search parameters that meet or exceed 0.90 recall@10. -* The formula is based on: - * Take the algorithm's throughput submitted to leaderboard, use it to scale no. of systems needed to scale to 100K qps (using ceiling to round up any decimal.) - * Capex = cost per system * scale no. 
- * Take w*s/q from algorithm's power metric submitted to leaderboard and convert to KwH/q. - * Multiply by total queries at 100K qps for 4 years = 4x365x24x60x60x100000 total queries over 4 years. - * Opex = (total queries over 4 years) * KwH/query * $0.10/KwH -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - -#### BigANN - -##### BigANN Recall Rankings - -|Rank|Submission |Team |Hardware |Status |R@10 | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|-------------| -| 1|[diskann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/diskann-bare-metal/README.md) |Microsoft Research(*org*) |Dell PowerEdge |inprog|**[0.99976](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/bigann-1B_recall.png)** | -| 2|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |inprog|**[0.99882](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/bigann-1B_recall.png)** | -| 3|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |inprog|**[0.99815](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/bigann-1B_recall.png)** | -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |inprog|**[0.99253](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/bigann-1B_recall.png)** | -| 5|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane 
|inprog|**[0.99084](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/bigann-1B_recall.png)** | -| 6|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**[0.92671](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/bigann-1B_recall.png)** | -| 7| -| -| -| -| -| -| 8| -| -| -| -| -| -| 9| -| -| -| -| -| -| 10| -| -| -| -| -| - -* The operational point for ranking is 2000 QPS. We will use the highest recall for the search parameters that meet or exceed 2000 QPS. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - -##### BigANN Throughput Rankings - -|Rank|Submission |Team |Hardware |Status |Q/S | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|-------------| -| 1|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |inprog|**[771,493.948](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/bigann-1B_throughput.png)** | -| 2|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |inprog|**[343,727.791](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/bigann-1B_throughput.png)** | -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |inprog|**[84,367.141](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/bigann-1B_throughput.png)** | -| 
4|[diskann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/diskann-bare-metal/README.md) |Microsoft Research(*org*) |Dell PowerEdge |inprog|**[19,094.371](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/bigann-1B_throughput.png)** | -| 5|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |inprog|**[9,504.865](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/bigann-1B_throughput.png)** | -| 6|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**[3,086.656](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/bigann-1B_throughput.png)** | -| 7| -| -| -| -| -| -| 8| -| -| -| -| -| -| 9| -| -| -| -| -| -| 10| -| -| -| -| -| - -* The operational point for ranking is 0.90 recall@10. We will use the highest throughput for the search parameters that meet or exceed 0.90 recall@10. 
-* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - -##### BigANN Power Rankings - -|Rank|Submission |Team |Hardware |Status |W*S/Q | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|-----------| -| 1|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |inprog|**[0.0002](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/bigann-1B_power.png)**| -| 2|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |inprog|**[0.0021](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/bigann-1B_power.png)**| -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |inprog|**[0.0024](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/bigann-1B_power.png)**| -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |inprog|**[0.0394](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/bigann-1B_power.png)**| -| 5|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**[0.1671](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/bigann-1B_power.png)**| -| 6|[-](-) |- |- |-|**-**| -| 7| -| -| -| -| -| -| 8| -| -| -| -| -| -| 9| -| -| -| -| -| -| 10| -| -| -| -| -| - -* The operational point for ranking is 0.90 recall@10. 
We will use the lowest power consumption for the search parameters that meet or exceed 0.90 recall@10. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - -##### BigANN Cost Rankings - -|Rank|Submission |Team |Hardware |Status |Cost |capex |opex |unit cost|units@100K qps|KwH*4yrs | -|----|--------------------|------------------------------|--------------------|--------|--------------|--------|--------|---------|--------------|---------| -| 1|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md)|Intel |Intel Optane |inprog|**$15,407.15** |$14,664.20|$742.95|$14,664.20 |1 |7,429.540| -| 2|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md)|GSI Technology(*org*) |LedaE APU |inprog|**$626,785.91** |$612,993.26|$13,792.65|$55,726.66 |11 |137,926.464| -| 3|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md)|Facebook Research(*org*) |NVidia GPU |final|**$785,282.45** |$726,722.70|$58,559.75|$22,021.90 |33 |585,597.505| -| 4|[-](-)|- |- |-|**-** |-|-|- |- |-| -| 5|[-](-)|- |- |-|**-** |-|-|- |- |-| -| 6|[-](-)|- |- |-|**-** |-|-|- |- |-| -| 7| -| -| -| -| -| -| -| -| -| -| -| 8| -| -| -| -| -| -| -| -| -| -| -| 9| -| -| -| -| -| -| -| -| -| -| -| 10| -| -| -| -| -| -| -| -| -| -| - -* The operational point for ranking is 0.90 recall@10. We will use the lowest power consumption/query for the search parameters that meet or exceed 0.90 recall@10. -* The formula is based on: - * Take the algorithm's throughput submitted to leaderboard, use it to scale no. of systems needed to scale to 100K qps (using ceiling to round up any decimal.) - * Capex = cost per system * scale no. - * Take w*s/q from algorithm's power metric submitted to leaderboard and convert to KwH/q. 
- * Multiply by total queries at 100K qps for 4 years = 4x365x24x60x60x100000 total queries over 4 years. - * Opex = (total queries over 4 years) * KwH/query * $0.10/KwH -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - -#### MSTuring - -##### MSTuring Recall Rankings - -|Rank|Submission |Team |Hardware |Status |R@10 | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|---------------| -| 1|[diskann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/diskann-bare-metal/README.md) |Microsoft Research(*org*) |Dell PowerEdge |inprog|**[0.99444](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/msturing-1B_recall.png)** | -| 2|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |inprog|**[0.98993](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/msturing-1B_recall.png)** | -| 3|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |inprog|**[0.98399](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/msturing-1B_recall.png)** | -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |inprog|**[0.97841](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/msturing-1B_recall.png)** | -| 5|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane 
|inprog|**[0.96218](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/msturing-1B_recall.png)** | -| 6|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**[0.90900](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/msturing-1B_recall.png)** | -| 7| -| -| -| -| -| -| 8| -| -| -| -| -| -| 9| -| -| -| -| -| -| 10| -| -| -| -| -| - -* The operational point for ranking is 2000 QPS. We will use the highest recall for the search parameters that meet or exceed 2000 QPS. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - -##### MSTuring Throughput Rankings - -|Rank|Submission |Team |Hardware |Status |Q/S | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|------------| -| 1|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |inprog|**[578,677.940](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/msturing-1B_throughput.png)** | -| 2|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |inprog|**[157,277.710](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/msturing-1B_throughput.png)** | -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |inprog|**[111,580.136](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/msturing-1B_throughput.png)** | -| 
4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |inprog|**[20,166.678](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/msturing-1B_throughput.png)** | -| 5|[diskann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/diskann-bare-metal/README.md) |Microsoft Research(*org*) |Dell PowerEdge |inprog|**[17,200.601](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/msturing-1B_throughput.png)** | -| 6|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**[2,359.485](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/msturing-1B_throughput.png)** | -| 7| -| -| -| -| -| -| 8| -| -| -| -| -| -| 9| -| -| -| -| -| -| 10| -| -| -| -| -| - -* The operational point for ranking is 0.90 recall@10. We will use the highest throughput for the search parameters that meet or exceed 0.90 recall@10. 
-* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - -##### MSTuring Power Rankings - -|Rank|Submission |Team |Hardware |Status|W*S/Q | -|----|-------------------------------------------------------|------------------------------|-----------------------|------|--------------| -| 1|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |inprog|**[0.0004](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/msturing-1B_power.png)** | -| 2|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |inprog|**[0.0017](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/msturing-1B_power.png)** | -| 3|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |inprog|**[0.0049](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/msturing-1B_power.png)** | -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |inprog|**[0.0227](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/msturing-1B_power.png)** | -| 5|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**[0.2037](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/msturing-1B_power.png)** | -| 6|[-](-) |- |- |-|**-** | -| 7| -| -| -| -| -| -| 8| -| -| -| -| -| -| 9| -| -| -| -| -| -| 10| -| -| -| -| -| - -* The operational point for ranking is 0.90 recall@10. 
We will use the lowest power consumption for the search parameters that meet or exceed 0.90 recall@10. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - -##### MSTuring Cost Rankings - -|Rank|Submission |Team |Hardware |Status |Cost |capex |opex |unit cost|units@100K qps|KwH*4yrs | -|----|------------------------------------|------------------------------|-----------------------|--------|--------------|--------|--------|---------|--------------|----------| -| 1|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |inprog|**$16,397.80** |$14,664.20|$1,733.60|$14,664.20 |1 |17,335.975 | -| 2|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |inprog|**$286,578.81** |$278,633.30|$7,945.51|$55,726.66 |5 |79,455.069 | -| 3|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**$1,018,332.30** |$946,941.70|$71,390.60|$22,021.90 |43 |713,905.964 | -| 4|[-](-) |- |- |-|**-** |-|-|- |- |- | -| 5|[-](-) |- |- |-|**-** |-|-|- |- |- | -| 6|[-](-) |- |- |-|**-** |-|-|- |- |- | -| 7| -| -| -| -| -| -| -| -| -| -| -| 8| -| -| -| -| -| -| -| -| -| -| -| 9| -| -| -| -| -| -| -| -| -| -| -| 10| -| -| -| -| -| -| -| -| -| -| - -* The operational point for ranking is 0.90 recall@10. We will use the lowest power consumption/query for the search parameters that meet or exceed 0.90 recall@10. -* The formula is based on: - * Take the algorithm's throughput submitted to leaderboard, use it to scale no. of systems needed to scale to 100K qps (using ceiling to round up any decimal.) - * Capex = cost per system * scale no. 
- * Take w*s/q from algorithm's power metric submitted to leaderboard and convert to KwH/q. - * Multiply by total queries at 100K qps for 4 years = 4x365x24x60x60x100000 total queries over 4 years. - * Opex = (total queries over 4 years) * KwH/query * $0.10/KwH -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - -#### MSSpace - -##### MSSpace Recall Rankings - -|Rank|Submission |Team |Hardware |Status |R@10 | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|---------| -| 1|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |inprog|**[0.0002](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/msspacev-1B_power.png)** | -| 2|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |inprog|**[0.0017](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/msspacev-1B_power.png)** | -| 3|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |inprog|**[0.0054](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/msspacev-1B_power.png)** | -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |inprog|**[0.0485](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/msspacev-1B_power.png)** | -| 5|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU 
|final|**[0.1674](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/msspacev-1B_power.png)** | -| 6|[-](-) |- |- |-|**-** | -| 7| -| -| -| -| -| -| 8| -| -| -| -| -| -| 9| -| -| -| -| -| -| 10| -| -| -| -| -| - -* The operational point for ranking is 2000 QPS. We will use the highest recall for the search parameters that meet or exceed 2000 QPS. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - -##### MSSpace Throughput Rankings - -|Rank|Submission |Team |Hardware |Status |Q/S | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|------------| -| 1|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |inprog|**[841,150.465](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/msspacev-1B_throughput.png)** | -| 2|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |inprog|**[139,612.021](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/msspacev-1B_throughput.png)** | -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |inprog|**[109,555.059](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/msspacev-1B_throughput.png)** | -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |inprog|**[8,587.024](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/msspacev-1B_throughput.png)** | -| 
5|[diskann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/diskann-bare-metal/README.md) |Microsoft Research(*org*) |Dell PowerEdge |inprog|**[6,503.212](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/msspacev-1B_throughput.png)** | -| 6|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**[2,770.848](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/msspacev-1B_throughput.png)** | -| 7| -| -| -| -| -| -| 8| -| -| -| -| -| -| 9| -| -| -| -| -| -| 10| -| -| -| -| -| - -* The operational point for ranking is 0.9 recall@10. We will use the highest throughput for the search parameters that meet or exceed 0.9 recall@10. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - -##### MSSpace Power Rankings - -|Rank|Submission |Team |Hardware |Status |W*S/Q | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|------------| -| 1|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |inprog|**[0.0002](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/msspacev-1B_power.png)** | -| 2|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |inprog|**[0.0017](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/msspacev-1B_power.png)** | -| 3|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane 
|inprog|**[0.0054](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/msspacev-1B_power.png)** | -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |inprog|**[0.0485](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/msspacev-1B_power.png)** | -| 5|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**[0.1674](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/msspacev-1B_power.png)** | -| 6|[-](-) |- |- |-|**-** | -| 7| -| -| -| -| -| -| 8| -| -| -| -| -| -| 9| -| -| -| -| -| -| 10| -| -| -| -| -| - -* The operational point for ranking is 0.9 recall@10. We will use the lowest power consumption for the search parameters that meet or exceed 0.9 recall@10. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - -##### MSSpace Cost Rankings - -|Rank|Submission |Team |Hardware |Status |Cost |capex |opex |unit cost|units@100K qps|KwH*4yrs | -|----|--------------------|------------------------------|-----------------------|------- |--------------|--------|--------|---------|--------------|----------| -| 1|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md)|Intel |Intel Optane |inprog|**$16,563.61** |$14,664.20|$1,899.41|$14,664.20 |1 |18,994.109 | -| 2|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md)|GSI Technology(*org*) |LedaE APU |inprog|**$685,704.76** |$668,719.92|$16,984.84|$55,726.66 |12 |169,848.419 | -| 3|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md)|Facebook 
Research(*org*) |NVidia GPU |final|**$873,460.84** |$814,810.30|$58,650.54|$22,021.90 |37 |586,505.424 | -| 4|[-](-)|- |- |-|**-** |-|-|- |- |- | -| 5|[-](-)|- |- |-|**-** |-|-|- |- |- | -| 6|[-](-)|- |- |-|**-** |-|-|- |- |- | -| 7| -| -| -| -| -| -| -| -| -| -| -| 8| -| -| -| -| -| -| -| -| -| -| -| 9| -| -| -| -| -| -| -| -| -| -| -| 10| -| -| -| -| -| -| -| -| -| -| - -* The operational point for ranking is 0.90 recall@10. We will use the lowest power consumption/query for the search parameters that meet or exceed 0.90 recall@10. -* The formula is based on: - * Take the algorithm's throughput submitted to leaderboard, use it to scale no. of systems needed to scale to 100K qps (using ceiling to round up any decimal.) - * Capex = cost per system * scale no. - * Take w*s/q from algorithm's power metric submitted to leaderboard and convert to KwH/q. - * Multiply by total queries at 100K qps for 4 years = 4x365x24x60x60x100000 total queries over 4 years. - * Opex = (total queries over 4 years) * KwH/query * $0.10/KwH -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - -#### Text2Image - -##### Text2Image Recall Rankings - -|Rank|Submission |Team |Hardware |Status |R@10 | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|-------------| -| 1|[diskann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/diskann-bare-metal/README.md) |Microsoft Research(*org*) |Dell PowerEdge |inprog|**[0.98130](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/text2image-1B_recall.png)** | -| 2|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU 
|inprog|**[0.94136](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/text2image-1B_recall.png)** | -| 3|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |inprog|**[0.90277](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/text2image-1B_recall.png)** | -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |inprog|**[0.88585](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/text2image-1B_recall.png)** | -| 5|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**[0.86028](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/text2image-1B_recall.png)** | -| 6|[-](-) |- |- |-|**-** | -| 7| -| -| -| -| -| -| 8| -| -| -| -| -| -| 9| -| -| -| -| -| -| 10| -| -| -| -| -| - -* The operational point for ranking is 2000 QPS. We will use the highest recall for the search parameters that meet or exceed 2000 QPS. 
-* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - -##### Text2Image Throughput Rankings - -|Rank|Submission |Team |Hardware |Status |Q/S | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|------------| -| 1|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |inprog|**[10,838.358](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/text2image-1B_throughput.png)** | -| 2|[diskann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/diskann-bare-metal/README.md) |Microsoft Research(*org*) |Dell PowerEdge |inprog|**[9,306.610](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/text2image-1B_throughput.png)** | -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |inprog|**[9,249.383](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/text2image-1B_throughput.png)** | -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |inprog|**[1,864.634](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/text2image-1B_throughput.png)** | -| 5|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**[1,762.363](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/text2image-1B_throughput.png)** | -| 6|[-](-) |- |- |-|**-** | -| 7| -| -| -| -| -| -| 8| -| -| -| -| -| -| 9| -| -| -| -| -| -| 10| -| -| -| -| -| - -* The 
operational point for ranking is 0.860 recall@10. We will use the highest throughput for the search parameters that meet or exceed 0.860 recall@10. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - -##### Text2Image Power Rankings - -|Rank|Submission |Team |Hardware |Status |W*S/Q | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|-----------| -| 1|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |inprog|**[0.0222](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/text2image-1B_power.png)**| -| 2|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |inprog|**[0.0702](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/text2image-1B_power.png)**| -| 3|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**[0.1233](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/text2image-1B_power.png)**| -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |inprog|**[0.1759](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/text2image-1B_power.png)**| -| 5|[-](-) |- |- |-|**-**| -| 6|[-](-) |- |- |-|**-**| -| 6| -| -| -| -| -| -| 7| -| -| -| -| -| -| 8| -| -| -| -| -| -| 9| -| -| -| -| -| -| 10| -| -| -| -| -| - -* The operational point for ranking is 0.86 recall@10. We will use the lowest power consumption for the search parameters that meet or exceed 0.86 recall@10. 
-* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - -##### Text2Image Cost Rankings - -|Rank|Submission |Team |Hardware |Status |Cost |capex |opex |unit cost|units@100K qps|KwH*4yrs | -|----|---------------------|------------------------------|---------------------|--------|--------------|--------|--------|---------|--------------|---------| -| 1|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |inprog|**$171,244.96** |$146,642.00|$24,602.96|$14,664.20 |10 |246,029.624| -| 2|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**$1,298,436.77** |$1,255,248.30|$43,188.47|$22,021.90 |57 |431,884.673| -| 3|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |inprog|**$3,070,882.16** |$3,009,239.64|$61,642.52|$55,726.66 |54 |616,425.231| -| 4|[-](-) |- |- |-|**-** |-|-|- |- |-| -| 5|[-](-) |- |- |-|**-** |-|-|- |- |-| -| 6|[-](-) |- |- |-|**-** |-|-|- |- |-| -| 7| -| -| -| -| -| -| -| -| -| -| -| 8| -| -| -| -| -| -| -| -| -| -| -| 9| -| -| -| -| -| -| -| -| -| -| -| 10| -| -| -| -| -| -| -| -| -| -| - -* The operational point for ranking is 0.86 recall@10. We will use the lowest power consumption/query for the search parameters that meet or exceed 0.86 recall@10. -* The formula is based on: - * Take the algorithm's throughput submitted to leaderboard, use it to scale no. of systems needed to scale to 100K qps (using ceiling to round up any decimal.) - * Capex = cost per system * scale no. - * Take w*s/q from algorithm's power metric submitted to leaderboard and convert to KwH/q. 
- * Multiply by total queries at 100K qps for 4 years = 4x365x24x60x60x100000 total queries over 4 years. - * Opex = (total queries over 4 years) * KwH/query * $0.10/KwH -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - -#### FBSimSearchNet - -##### FBSimSearchNet AP Rankings - -|Rank|Submission |Team |Hardware |Status |AP | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|-------------| -| 1|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |inprog|**[0.99053](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/ssnpp-1B_recall.png)** | -| 2|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**[0.97863](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/ssnpp-1B_recall.png)** | -| 3|[-](-) |- |- |-|**-** | -| 4|[-](-) |- |- |-|**-** | -| 5|[-](-) |- |- |-|**-** | -| 6|[-](-) |- |- |-|**-** | -| 7| -| -| -| -| -| -| 8| -| -| -| -| -| -| 9| -| -| -| -| -| -| 10| -| -| -| -| -| - -* The operational point for ranking is 2000 QPS. We will use the highest recall for the search parameters that meet or exceed 2000 QPS. 
-* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - -##### FBSimSearchNet Throughput Rankings - -|Rank|Submission |Team |Hardware |Status |Q/S | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|------------| -| 1|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |inprog|**[8,123.552](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/ssnpp-1B_throughput.png)** | -| 2|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**[5,572.272](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/ssnpp-1B_throughput.png)** | -| 3|[-](-) |- |- |-|**-** | -| 4|[-](-) |- |- |-|**-** | -| 5|[-](-) |- |- |-|**-** | -| 6|[-](-) |- |- |-|**-** | -| 7| -| -| -| -| -| -| 8| -| -| -| -| -| -| 9| -| -| -| -| -| -| 10| -| -| -| -| -| - -* The operational point for ranking is 0.9 recall@10. We will use the highest throughput for the search parameters that meet or exceed 0.9 average precision. 
-* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - - -##### FBSimSearchNet Power Rankings - -|Rank|Submission |Team |Hardware |Status |W*S/Q | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|-----------| -| 1|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |inprog|**[0.0540](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/ssnpp-1B_power.png)**| -| 2|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**[0.0949](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/ssnpp-1B_power.png)**| -| 3|[-](-) |- |- |-|**-**| -| 4|[-](-) |- |- |-|**-**| -| 5|[-](-) |- |- |-|**-**| -| 6|[-](-) |- |- |-|**-**| -| 7| -| -| -| -| -| -| 8| -| -| -| -| -| -| 9| -| -| -| -| -| -| 10| -| -| -| -| -| - -* The operational point for ranking is 0.9 recall@10. We will use the lowest power consumption for the search parameters that meet or exceed 0.9 average precision. 
-* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - -##### FBSimSearchNet Cost Rankings - -|Rank|Submission |Team |Hardware |Status |Cost |capex |opex |unit cost|units@100K qps|KwH*4yrs | -|----|--------------------|------------------------------|---------------------|--------|--------------|--------|--------|---------|--------------|---------| -| 1|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md)|Facebook Research(*org*) |NVidia GPU |final|**$429,634.84** |$396,394.20|$33,240.64|$22,021.90 |18 |332,406.441| -| 2|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md)|GSI Technology(*org*) |LedaE APU |inprog|**$743,385.69** | -| -| -| -| -| -| 3|[-](-)|- |- |-|**-** | -| -| -| -| -| -| 4|[-](-)|- |- |-|**-** | -| -| -| -| -| -| 5| -| -| -| -| -| -| -| -| -| -| -| 6| -| -| -| -| -| -| -| -| -| -| -| 7| -| -| -| -| -| -| -| -| -| -| -| 8| -| -| -| -| -| -| -| -| -| -| -| 9| -| -| -| -| -| -| -| -| -| -| -| 10| -| -| -| -| -| -| -| -| -| -| - -* The operational point for ranking is 0.9 recall@10. We will use the lowest power consumption/query for the search parameters that meet or exceed 0.9 recall@10. -* The formula is based on: - * Take the algorithm's throughput submitted to leaderboard, use it to scale no. of systems needed to scale to 100K qps (using ceiling to round up any decimal.) - * Capex = cost per system * scale no. - * Take w*s/q from algorithm's power metric submitted to leaderboard and convert to KwH/q. - * Multiply by total queries at 100K qps for 4 years = 4x365x24x60x60x100000 total queries over 4 years. 
- * Opex = (total queries over 4 years) * KwH/query * $0.10/KwH -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - diff --git a/t3/LB_history/Nov.29.2021/TASKS_ISSUES_RESOLUTIONS.md b/t3/LB_history/Nov.29.2021/TASKS_ISSUES_RESOLUTIONS.md deleted file mode 100644 index e9a750712..000000000 --- a/t3/LB_history/Nov.29.2021/TASKS_ISSUES_RESOLUTIONS.md +++ /dev/null @@ -1,42 +0,0 @@ - -# BigANN Challenge T3 Tasks, Issues, and Resolutions - -In the spirit of maintaining a fair and open competition, we will be tracking all important remaining tasks and issues, and their respective resolution - and making that all public here on this README. All competition rankings and winners will be "unofficial" until all tasks and issues have been resolved. - -Participants should send their questions and issues to the T3 organizer directly (gwilliams@gsitechnology.com), or to the competition google group at big-ann-organizers@googlegroups.com. Note that some issues may require a complete re-evaluation of an algorithm on its respective hardware, or may require additional information from a participant or competition organizer(s). - -## Tasks (open) - -* [T3 Organizer to Microsoft] Currently reported DiskANN CSV results is using an old version of recall computation (ie, not accounting for ties and it will likely affect msspacev-1B recall mostly). - * PENDING RESOLUTION: [Microsoft to T3 Organizer] Will re-base and send the CSV. -* [Microsoft to T3 Organizer] Currently, DiskANN cannot qualify for power and cost benchmarks due to issue with running IPMICAP ( python ipmi in particular seems to be the issue. ) - * PENDING RESOLUTION: [T3 Organizer to Microsoft] We will work on local dcmi support in the IPMICAP server. -* [GSI to T3 Organizer] New index for SSNPP and Text2Image requires re-evaluation for those datasets and updated scores. 
- * PENDING RESOLUTION: [T3 Organizer to GSI] We ran SSNPP to completion, but are having issues with Text2Image. -* [T3 Organizer to Microsoft] Need to retrieve "results" h5py files from MS DiskANN remote machine. - -## Issues (open) - -* [Intel asks T3 Organizer] Why won't there be one winner for T3 that combines all individual benchmarks? - * PENDING RESOLUTION: [T3 Organizer to Intel] We have provided the reason. Hopefully it's a good enough explanation and we can soon remove this issue. -* [Intel asks T3 Organizer] Why are power and cost rankings optional for a submission? - * PENDING RESOLUTION: [T3 Organizer to Intel] We have provided the reason. Hopefully it's a good enough explanation and we can soon remove this issue. -* [GSI to T3 Organizers] We cannot reproduce the baseline performance on SSNPP on same/similar hardware. - * PENDING RESOLUTION: [T3 Organizer to GSI] We've reproduced and sent the results. Please approve. -* [T3 Organizer asks NVidia] Can't we use an MSRP from another company as proxy for system cost? - * PENDING RESOLUTION: [T3 Organizer to NVidia] We will take the cheapest MSRP from third party seller. Please approve. -* [GSI to T3 Organizers] Have you discussed taking power also on the recall working point and not just on the throughput working point? -* [GSI asks T3 Organizers] Some algorithms implement smart caching mechanisms to simulate real life scenarios, and the competition framework sends the same queries again and again, 50 times for each dataset (5 runs x 10 query configurations), which is not a real life case. It is important that the competition framework verifies, automatically (and if not possible, manually), that no caching mechanism is used in between runs and in between query configurations. One way is to make sure that the throughput for the runs doesn’t differ much taking into account that there are 5 runs and 10 configurations with the same queries.
Probably a better way is to send different queries or somehow cool down the cache in between runs by sending random queries. - * PENDING RESOLUTION: [T3 Organizers to GSI] We will add a "cache detection" countermeasure to the framework and re-evaluate all submissions. - -## Resolutions - -* [GSI asked] What does NQ mean? - * [T3 Organizer responded] It could mean 1) team did not submit a qualifying algorithm for the benchmark 2) team decided not to participate in that benchmark 3) unable to get some key data for the benchmark (such as power or system cost, or both). -* [T3 Organizer self-report] Need to retrieve "results" h5py files from NVidia's remote machine. - * Done on 11/23/2021 -* [T3 Organizer to NVidia] Need to retrieve power monitoring "results" h5py files from NVidia's remote machine. - * Done on 11/23/2021 and subsequently on changes to algos.yaml -* [GSI to T3 Organizer] Need better documentation for how to extract power benchmark from plot.py script. - * Answered via email. Basically, you need to supply "wspq" as an explicit metric you want to retrieve using the chosen axis. Run "python plot.py --help" to get more information. - diff --git a/t3/LEADERBOARDS.md b/t3/LEADERBOARDS.md deleted file mode 100644 index 801c76605..000000000 --- a/t3/LEADERBOARDS.md +++ /dev/null @@ -1,41 +0,0 @@ - -# BigANN Challenge T3 Leaderboards and Winners - -We rank participants based on 4 different but inter-related benchmarks: -* One based on recall/average precision -* One based on throughput -* One based on power consumption -* One based on hardware cost - -We maintain two sets of leaderboards that rank participants on all benchmarks: -* [Leaderboards based on a public query dataset](LEADERBOARDS_PUBLIC.md) to which participants had access during the competition. -* [Leaderboards based on a private query dataset](LEADERBOARDS_PRIVATE.md) on which submissions are currently being evaluated.
- -Please consult the main [T3 track README](README.md) for more details about benchmarks and ranking methodology. - -## Public Dataset Leaderboards And Winners - -The leaderboards and rankings on the public dataset live [here](LEADERBOARDS_PUBLIC.md). - -We would like to congratulate all the winners of this part of the competition, teams from Intel and NVidia: -* Sourabh Dongaonkar (Intel Corporate) -* Mariano Tepper (Intel Labs) -* Yong Wong (NVidia) -* Akira Naruse (NVidia) -* Jingrong Zhang (NVidia) -* Mahesh Doijade (NVidia) - -We are in the process of resolving the remaining issues and tasks. - -Upon completion, we will make the rankings and winners official. - -Please revisit this page again soon for more updates. - -## Private Dataset Leaderboards Status - -The status of the leaderboards and rankings on the private dataset lives [here](LEADERBOARDS_PRIVATE.md). - -All submissions are currently being evaluated using the private data sets, so the scores (and rankings) could change as evaluation proceeds. - -Please revisit this page again soon for more updates. - diff --git a/t3/LEADERBOARDS_PRIVATE.md b/t3/LEADERBOARDS_PRIVATE.md deleted file mode 100644 index 5b2a588cc..000000000 --- a/t3/LEADERBOARDS_PRIVATE.md +++ /dev/null @@ -1,566 +0,0 @@ -# T3 Track Private Dataset Leaderboards - -Please note that all rankings and winners are unofficial until all [open tasks and issues](TASKS_ISSUES_RESOLUTIONS.md) are resolved.
- -## Rankings By Category - -### Rankings By Submission Name (alphabetical) - -|Submission |Team |Hardware |[Recall Rank](#recall-or-ap-rankings)|[Thru-put Rank](#throughput-rankings)|[Power Rank](#power-rankings)|[Cost Rank](#cost-rankings)|Status |Anomalies|Evaluator|Algo |Runs | -|--------------------|-----------|----------|---------|---------|---------|--------|---------|---------|---------|---------|--------| -|[diskann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/diskann-bare-metal/README.md) |Microsoft Research India(*org*) |Dell PowerEdge |*NA* |*NA* |*NA* |*NA* |eval |*NA* |[Harsha Simhadri](https://github.com/harsha-simhadri) |[src](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/benchmark/algorithms/diskann-t2.py) |NA | -|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |[5](#recall-or-ap-rankings) |[5](#throughput-rankings) |[5](#power-rankings) |[4](#cost-rankings) |eval |0/49 |[George Williams](https://github.com/sourcesync) |[src](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/benchmark/algorithms/faiss_t3.py) |[nb](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/EvalPrivate.ipynb) | -|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |[3](#recall-or-ap-rankings) |[4](#throughput-rankings) |[4](#power-rankings) |[5](#cost-rankings) |eval |0/50 |[George Williams](https://github.com/sourcesync) |[src](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/benchmark/algorithms/gemini.py) |[nb](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/EvalPrivate.ipynb) | -|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |[1](#recall-or-ap-rankings) |[3](#throughput-rankings) 
|[1](#power-rankings) |[2](#cost-rankings)\*\* |eval |[6/40](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/ANOMALIES.md) |[George Williams](https://github.com/sourcesync) |[src](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/benchmark/algorithms/cuanns_ivfpq.py) |[nb](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/EvalPrivate.ipynb) | -|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |[4](#recall-or-ap-rankings) |[1](#throughput-rankings) |[3](#power-rankings) |[3](#cost-rankings)\*\* |eval |[3/30](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/ANOMALIES.md) |[George Williams](https://github.com/sourcesync) |[src](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/benchmark/algorithms/cuanns_multigpu.py) |NA | -|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md)|Intel |Intel Optane |[2](#recall-or-ap-rankings) |[2](#throughput-rankings) |[2](#power-rankings) |[1](#cost-rankings)|eval |[4/40](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/ANOMALIES.md) |[George Williams](https://github.com/sourcesync) |[src](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/benchmark/algorithms/graphann.py) |[nb](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/EvalPrivate.ipynb)| - -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. 
- * *NQ* = not qualified - * *NA* = data is not yet available, or has not yet been processed - -* *Anomalies* are defined as queries that could potentially be the result of query response caching, a violation of the competition. Our detection method looks for a 30% or more improvement in the batch query latency between the first and last query of a query group (5). Participants have been given a chance to explain why detected anomalies (if any) are not a result of query response caching. In general, our analysis did not uncover this symptom of systematic query response caching from any submission. Also, if we throw out the anomalous data points, the [adjusted leaderboard rankings](LEADERBOARDS_PRIVATE_REJECT_ANOMALIES.md) do not change even though some scores change slightly. - -* \*\*Nvidia has not yet approved the MSRP cost used for ranking, so participation in this benchmark is still pending. - -### Rankings Per Benchmark - -#### Recall Or AP Rankings - -|Rank|Submission |Team |Hardware|Status |Score |[Deep1B](#deep1B-recall-rankings)|[BigANN](#bigann-recall-rankings)|[MSTuring](#msturing-recall-rankings)|[MSSpace](#msspace-recall-rankings)|[Text2Image](#text2image-recall-rankings)|[FBSSNet](#fbsimsearchnet-ap-rankings)| -|----|------------------|-------|--------|-------|-----------|------|------|--------|-------|----------|-------| -| 1|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md)|NVidia|NVidia GPU |eval|**0.225**|[0.99541](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/private_deep-1B_recall.png) |[0.99882](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/private_bigann-1B_recall.png) |[0.99054](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/private_msturing-1B_recall.png) |- 
|[0.63732](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/private_text2image-1B_recall.png) |- | -| 2|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md)|Intel|Intel Optane |eval|**0.224**|[0.99872](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/private_deep-1B_recall.png) |[0.99977](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/private_bigann-1B_recall.png) |[0.99561](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/private_msturing-1B_recall.png) |- |[0.62692](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/private_text2image-1B_recall.png) |- | -| 3|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md)|GSI Technology(*org*)|LedaE APU |eval|**0.197**|[0.99185](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/private_deep-1B_recall.png) |[0.99452](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/private_bigann-1B_recall.png) |[0.97719](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/private_msturing-1B_recall.png) |- |[0.61895](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/private_text2image-1B_recall.png) |[0.99672](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/private_ssnpp-1B_recall.png) | -| 4|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md)|NVidia|NVidia GPU |eval|**0.182**|[0.99551](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/private_deep-1B_recall.png) 
|[0.99872](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/private_bigann-1B_recall.png) |[0.98330](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/private_msturing-1B_recall.png) |- |- |- | -| 5|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md)|Facebook Research(*org*)|NVidia GPU |eval|**baseline**|[0.94437](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/private_deep-1B_recall.png) |[0.93604](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/private_bigann-1B_recall.png) |[0.91513](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/private_msturing-1B_recall.png) |- |[0.60105](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/private_text2image-1B_recall.png) |[0.98567](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/private_ssnpp-1B_recall.png) | -| 6|[-](-)|-|- |-|**-**|- |- |- |- |- |- | - -* A submission must support at least 3 databases to qualify for this ranking. -* The ranking is based on the score, which is the sum of benchmark improvements of qualifying databases (shown in specific database columns after the score column.) -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. 
- -#### Throughput Rankings - -|Rank|Submission |Team |Hardware|Status |Score |[Deep1B](#deep1B-throughput-rankings)|[BigANN](#bigann-throughput-rankings)|[MSTuring](#msturing-throughput-rankings)|[MSSpace](#msspace-throughput-rankings)|[Text2Image](#text2image-throughput-rankings)|[FBSSNet](#fbsimsearchnet-throughput-rankings)| -|----|------------------|-------|--------|-------|-----------|------|------|--------|-------|----------|--------------| -| 1|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md)|NVidia|NVidia GPU |eval|**2116124**|[968,840](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/private_deep-1B_throughput.png) |[764,700](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/private_bigann-1B_throughput.png) |[393,528](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/private_msturing-1B_throughput.png) |- |- |- | -| 2|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md)|Intel|Intel Optane |eval|**685763**|[210,403](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/private_deep-1B_throughput.png) |[350,007](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/private_bigann-1B_throughput.png) |[127,883](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/private_msturing-1B_throughput.png) |- |[10,364](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/private_text2image-1B_throughput.png) |- | -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md)|NVidia|NVidia GPU 
|eval|**297608**|[94,042](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/private_deep-1B_throughput.png) |[84,806](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/private_bigann-1B_throughput.png) |[110,886](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/private_msturing-1B_throughput.png) |- |[20,765](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/private_text2image-1B_throughput.png) |- | -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md)|GSI Technology(*org*)|LedaE APU |eval|**30425**|[12,345](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/private_deep-1B_throughput.png) |[10,868](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/private_bigann-1B_throughput.png) |[14,862](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/private_msturing-1B_throughput.png) |- |[2,154](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/private_text2image-1B_throughput.png) |[9,343](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/private_ssnpp-1B_throughput.png) | -| 5|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md)|Facebook Research(*org*)|NVidia GPU |eval|**baseline**|[5,035](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/private_deep-1B_throughput.png) |[3,279](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/private_bigann-1B_throughput.png) |[2,630](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/private_msturing-1B_throughput.png) |- 
|[1,948](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/private_text2image-1B_throughput.png) |[6,256](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/private_ssnpp-1B_throughput.png) | -| 6|[-](-)|-|- |-|**-**|- |- |- |- |- |- | - -* A submission must support at least 3 databases to qualify for this ranking. -* The ranking is based on the score, which is the sum of benchmark improvements of qualifying databases (shown in specific database columns after the score column.) -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. - -#### Power Rankings - -|Rank|Submission |Team |Hardware|Status |Score |[Deep1B](#deep1B-power-rankings)|[BigANN](#bigann-power-rankings)|[MSTuring](#msturing-power-rankings)|[MSSpace](#msspace-power-rankings)|[Text2Image](#text2image-power-rankings)|[FBSSNet](#fbsimsearchnet-power-rankings)| -|----|------------------|-------|--------|-------|-----------|------|------|--------|-------|-----|-----| -| 1|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md)|NVidia|NVidia GPU |eval|**-0.475**|[0.0104](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/private_deep-1B_power.png) |[0.0119](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/private_bigann-1B_power.png) |[0.0099](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/private_msturing-1B_power.png) |- |[0.0441](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/private_text2image-1B_power.png)|-| -| 2|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md)|Intel|Intel Optane 
|eval|**-0.469**|[0.0036](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/private_deep-1B_power.png) |[0.0020](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/private_bigann-1B_power.png) |[0.0054](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/private_msturing-1B_power.png) |- |[0.0710](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/private_text2image-1B_power.png)|-| -| 3|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md)|NVidia|NVidia GPU |eval|**-0.431**|[0.0025](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/private_deep-1B_power.png) |[0.0022](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/private_bigann-1B_power.png) |[0.0061](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/private_msturing-1B_power.png) |- |-|-| -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md)|GSI Technology(*org*)|LedaE APU |eval|**-0.232**|[0.0352](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/private_deep-1B_power.png) |[0.0342](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/private_bigann-1B_power.png) |[0.0250](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/private_msturing-1B_power.png) |- |[0.2661](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/private_text2image-1B_power.png)|[0.0433](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/private_ssnpp-1B_power.png)| -| 
5|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md)|Facebook Research(*org*)|NVidia GPU |eval|**baseline**|[0.0923](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/private_deep-1B_power.png) |[0.1623](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/private_bigann-1B_power.png) |[0.1874](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/private_msturing-1B_power.png) |- |[0.1091](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/private_text2image-1B_power.png)|[0.0847](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/private_ssnpp-1B_power.png)| -| 6|[-](-)|-|- |-|**-**|- |- |- |- |-|-| - -* A submission must support at least 3 databases to qualify for this ranking. -* The ranking is based on the score, which is the sum of benchmark improvements of qualifying databases (shown in specific database columns after the score column.) -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. 
- -#### Cost Rankings - -|Rank|Submission |Team |Hardware|Status |Score |[Deep1B](#deep1B-cost-rankings)|[BigANN](#bigann-cost-rankings)|[MSTuring](#msturing-cost-rankings)|[MSSpace](#msspace-cost-rankings)|[Text2Image](#text2image-cost-rankings)|[FBSSNet](#fbsimsearchnet-cost-rankings)| -|----|------------------|-------|--------|-------|-----------|------|------|--------|-------|----------|--------------| -| 1|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md)|Intel|Intel Optane |eval|**$-3,100,829.55**|$15,918.69 |$15,372.40 |$16,572.66 |- |$171,523.05 |- | -| 2|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md)|NVidia|NVidia GPU |eval|**$-1,793,445.89\*\***|$303,647.91 |$304,177.20 |$153,483.45 |- |$765,461.90 |- | -| 3|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md)|NVidia|NVidia GPU |eval|**$-1,683,055.85\*\***|$150,863.29 |$150,786.43 |$152,142.96 |- |- |- | -| 4|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md)|Facebook Research(*org*)|NVidia GPU |eval|**baseline**|$472,764.09 |$739,552.84 |$924,531.60 |- |$1,183,367.83 |$382,013.99 | -| 5|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md)|GSI Technology(*org*)|LedaE APU |eval|**$1,120,285.77**|$513,869.50 |$569,253.60 |$398,832.13 |- |$2,712,384.33 |$628,176.55 | -| 6|[-](-)|-|- |-|**-**|- |- |- |- |- |- | - -* A submission must support at least 3 databases to qualify for this ranking. -* The ranking is based on the score, which is the sum of benchmark improvements of qualifying databases (shown in specific database columns after the score column.) -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. 
- * *final* = final submission and ranking. - -* \*\*Nvidia has not yet approved the MSRP cost used for ranking, so participation in this benchmark is still pending. - -### Rankings Per Database - -#### Deep1B - -##### Deep1B Recall Rankings - -|Rank|Submission |Team |Hardware |Status |R@10 | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|-----------| -| 1|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |eval|**[0.99872](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/private_deep-1B_recall.png)**| -| 2|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |eval|**[0.99551](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/private_deep-1B_recall.png)**| -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |eval|**[0.99541](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/private_deep-1B_recall.png)**| -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |eval|**[0.99185](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/private_deep-1B_recall.png)**| -| 5|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |eval|**[0.94437](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/private_deep-1B_recall.png)**| -| 6|[-](-) |- |- |-|**-**| - -* The operational point for ranking is 2000 QPS. We will use the highest recall for the search parameters that meet or exceed 2000 QPS. 
-* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. - -##### Deep1B Throughput Rankings - -|Rank|Submission |Team |Hardware |Status |Q/S | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|-----------| -| 1|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |eval|**[968,840](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/private_deep-1B_throughput.png)**| -| 2|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |eval|**[210,403](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/private_deep-1B_throughput.png)**| -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |eval|**[94,042](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/private_deep-1B_throughput.png)**| -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |eval|**[12,345](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/private_deep-1B_throughput.png)**| -| 5|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |eval|**[5,035](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/private_deep-1B_throughput.png)**| -| 6|[-](-) |- |- |-|**-**| - -* The operational point for ranking is 0.90 recall@10. 
We will use the highest throughput for the search parameters that meet or exceed 0.90 recall@10. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. - -##### Deep1B Power Rankings - -|Rank|Submission |Team |Hardware |Status |W*S/Q | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|-----------| -| 1|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |eval|**[0.0025](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/private_deep-1B_power.png)**| -| 2|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |eval|**[0.0036](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/private_deep-1B_power.png)**| -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |eval|**[0.0104](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/private_deep-1B_power.png)**| -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |eval|**[0.0352](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/private_deep-1B_power.png)**| -| 5|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |eval|**[0.0923](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/private_deep-1B_power.png)**| -| 6|[-](-) |- |- |-|**-**| - -* The operational point for ranking is 0.90 recall@10. 
We will use the lowest power consumption for the search parameters that meet or exceed 0.90 recall@10. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. - -##### Deep1B Cost Rankings - -|Rank|Submission |Team |Hardware |Status |Cost |capex |opex |unit cost|units@100K qps|KwH*4yrs | -|----|--------------------|---------|-----------------------|--------|-------------|--------|--------|---------|--------------|---------| -| 1|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md)|Intel |Intel Optane |eval|**$15,918.69** |$14,664.20|$1,254.49|$14,664.20 |1 |12,544.902| -| 2|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md)|NVidia |NVidia GPU |eval|**$150,863.29\*\*** |$150,000.00|$863.29|$150,000.00 |1 |8,632.870| -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md)|NVidia |NVidia GPU |eval|**$303,647.91\*\*** |$300,000.00|$3,647.91|$150,000.00 |2 |36,479.145| -| 4|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md)|Facebook Research(*org*) |NVidia GPU |eval|**$472,764.09** |$440,438.00|$32,326.09|$22,021.90 |20 |323,260.873| -| 5|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md)|GSI Technology(*org*) |LedaE APU |eval|**$513,869.50** |$501,539.94|$12,329.56|$55,726.66 |9 |123,295.635| -| 6|[-](-)|- |- |-|**-** |-|-|- |- |-| - -* The operational point for ranking is 0.90 recall@10. We will use the lowest power consumption/query for the search parameters that meet or exceed 0.90 recall@10. -* The formula is based on: - * Take the algorithm's throughput submitted to leaderboard, use it to scale no. 
of systems needed to scale to 100K qps (using ceiling to round up any decimal.) - * Capex = cost per system * scale no. - * Take w*s/q from algorithm's power metric submitted to leaderboard and convert to KwH/q. - * Multiply by total queries at 100K qps for 4 years = 4x365x24x60x60x100000 total queries - * Opex = (total queries over 4 years) * KwH/query * $0.10/KwH -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. -* \*\*Nvidia has not yet approved the MSRP cost used for ranking, so participation in this benchmark is still pending. - -#### BigANN - -##### BigANN Recall Rankings - -|Rank|Submission |Team |Hardware |Status |R@10 | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|-------------| -| 1|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |eval|**[0.99977](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/private_bigann-1B_recall.png)** | -| 2|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |eval|**[0.99882](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/private_bigann-1B_recall.png)** | -| 3|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |eval|**[0.99872](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/private_bigann-1B_recall.png)** | -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU 
|eval|**[0.99452](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/private_bigann-1B_recall.png)** | -| 5|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |eval|**[0.93604](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/private_bigann-1B_recall.png)** | -| 6|[-](-) |- |- |-|**-** | - -* The operational point for ranking is 2000 QPS. We will use the highest recall for the search parameters that meet or exceed 2000 QPS. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. - -##### BigANN Throughput Rankings - -|Rank|Submission |Team |Hardware |Status |Q/S | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|-------------| -| 1|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |eval|**[764,700](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/private_bigann-1B_throughput.png)** | -| 2|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |eval|**[350,007](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/private_bigann-1B_throughput.png)** | -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |eval|**[84,806](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/private_bigann-1B_throughput.png)** | -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI 
Technology(*org*) |LedaE APU |eval|**[10,868](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/private_bigann-1B_throughput.png)** | -| 5|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |eval|**[3,279](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/private_bigann-1B_throughput.png)** | -| 6|[-](-) |- |- |-|**-** | - -* The operational point for ranking is 0.90 recall@10. We will use the highest throughput for the search parameters that meet or exceed 0.90 recall@10. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. - -##### BigANN Power Rankings - -|Rank|Submission |Team |Hardware |Status |W*S/Q | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|-----------| -| 1|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |eval|**[0.0020](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/private_bigann-1B_power.png)**| -| 2|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |eval|**[0.0022](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/private_bigann-1B_power.png)**| -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |eval|**[0.0119](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/private_bigann-1B_power.png)**| -| 
4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |eval|**[0.0342](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/private_bigann-1B_power.png)**| -| 5|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |eval|**[0.1623](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/private_bigann-1B_power.png)**| -| 6|[-](-) |- |- |-|**-**| - -* The operational point for ranking is 0.90 recall@10. We will use the lowest power consumption for the search parameters that meet or exceed 0.90 recall@10. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. - -##### BigANN Cost Rankings - -|Rank|Submission |Team |Hardware |Status |Cost |capex |opex |unit cost|units@100K qps|KwH*4yrs | -|----|--------------------|------------------------------|--------------------|--------|--------------|--------|--------|---------|--------------|---------| -| 1|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md)|Intel |Intel Optane |eval|**$15,372.40** |$14,664.20|$708.20|$14,664.20 |1 |7,082.016| -| 2|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md)|NVidia |NVidia GPU |eval|**$150,786.43\*\*** |$150,000.00|$786.43|$150,000.00 |1 |7,864.254| -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md)|NVidia |NVidia GPU |eval|**$304,177.20\*\*** |$300,000.00|$4,177.20|$150,000.00 |2 |41,771.962| -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md)|GSI Technology(*org*) |LedaE APU 
|eval|**$569,253.60** |$557,266.60|$11,987.00|$55,726.66 |10 |119,870.019| -| 5|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md)|Facebook Research(*org*) |NVidia GPU |eval|**$739,552.84** |$682,678.90|$56,873.94|$22,021.90 |31 |568,739.415| -| 6|[-](-)|- |- |-|**-** |-|-|- |- |-| - -* The operational point for ranking is 0.90 recall@10. We will use the lowest power consumption/query for the search parameters that meet or exceed 0.90 recall@10. -* The formula is based on: - * Take the algorithm's throughput submitted to leaderboard, use it to scale no. of systems needed to scale to 100K qps (using ceiling to round up any decimal.) - * Capex = cost per system * scale no. - * Take w*s/q from algorithm's power metric submitted to leaderboard and convert to KwH/q. - * Multiply by total queries at 100K qps for 4 years = 4x365x24x60x60x100000 total queries over 4 years. - * Opex = (total queries over 4 years) * KwH/query * $0.10/KwH -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. -* \*\*Nvidia has not yet approved the MSRP cost used for ranking, so participation in this benchmark is still pending. 
- -#### MSTuring - -##### MSTuring Recall Rankings - -|Rank|Submission |Team |Hardware |Status |R@10 | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|---------------| -| 1|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |eval|**[0.99561](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/private_msturing-1B_recall.png)** | -| 2|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |eval|**[0.99054](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/private_msturing-1B_recall.png)** | -| 3|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |eval|**[0.98330](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/private_msturing-1B_recall.png)** | -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |eval|**[0.97719](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/private_msturing-1B_recall.png)** | -| 5|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |eval|**[0.91513](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/private_msturing-1B_recall.png)** | -| 6|[-](-) |- |- |-|**-** | - -* The operational point for ranking is 2000 QPS. We will use the highest recall for the search parameters that meet or exceed 2000 QPS. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. 
- * *final* = final submission and ranking. - -##### MSTuring Throughput Rankings - -|Rank|Submission |Team |Hardware |Status |Q/S | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|------------| -| 1|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |eval|**[393,528](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/private_msturing-1B_throughput.png)** | -| 2|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |eval|**[127,883](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/private_msturing-1B_throughput.png)** | -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |eval|**[110,886](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/private_msturing-1B_throughput.png)** | -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |eval|**[14,862](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/private_msturing-1B_throughput.png)** | -| 5|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |eval|**[2,630](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/private_msturing-1B_throughput.png)** | -| 6|[-](-) |- |- |-|**-** | - -* The operational point for ranking is 0.90 recall@10. We will use the highest throughput for the search parameters that meet or exceed 0.90 recall@10. 
-* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. - -##### MSTuring Power Rankings - -|Rank|Submission |Team |Hardware |Status|W*S/Q | -|----|-------------------------------------------------------|------------------------------|-----------------------|------|--------------| -| 1|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |eval|**[0.0054](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/private_msturing-1B_power.png)** | -| 2|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |eval|**[0.0061](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/private_msturing-1B_power.png)** | -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |eval|**[0.0099](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/private_msturing-1B_power.png)** | -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |eval|**[0.0250](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/private_msturing-1B_power.png)** | -| 5|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |eval|**[0.1874](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/private_msturing-1B_power.png)** | -| 6|[-](-) |- |- |-|**-** | - -* The operational point for ranking is 0.90 recall@10. 
We will use the lowest power consumption for the search parameters that meet or exceed 0.90 recall@10. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. - -##### MSTuring Cost Rankings - -|Rank|Submission |Team |Hardware |Status |Cost |capex |opex |unit cost|units@100K qps|KwH*4yrs | -|----|------------------------------------|------------------------------|-----------------------|--------|--------------|--------|--------|---------|--------------|----------| -| 1|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |eval|**$16,572.66** |$14,664.20|$1,908.46|$14,664.20 |1 |19,084.644 | -| 2|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |eval|**$152,142.96\*\*** |$150,000.00|$2,142.96|$150,000.00 |1 |21,429.628 | -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |eval|**$153,483.45\*\*** |$150,000.00|$3,483.45|$150,000.00 |1 |34,834.523 | -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |eval|**$398,832.13** |$390,086.62|$8,745.51|$55,726.66 |7 |87,455.147 | -| 5|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |eval|**$924,531.60** |$858,854.10|$65,677.50|$22,021.90 |39 |656,775.000 | -| 6|[-](-) |- |- |-|**-** |-|-|- |- |- | - -* The operational point for ranking is 0.90 recall@10. We will use the lowest power consumption/query for the search parameters that meet or exceed 0.90 recall@10. 
-* The formula is based on: - * Take the algorithm's throughput submitted to leaderboard, use it to scale no. of systems needed to scale to 100K qps (using ceiling to round up any decimal.) - * Capex = cost per system * scale no. - * Take w*s/q from algorithm's power metric submitted to leaderboard and convert to KwH/q. - * Multiply by total queries at 100K qps for 4 years = 4x365x24x60x60x100000 total queries over 4 years. - * Opex = (total queries over 4 years) * KwH/query * $0.10/KwH -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. -* \*\*Nvidia has not yet approved the MSRP cost used for ranking, so participation in this benchmark is still pending. - -#### MSSpace - -##### MSSpace Recall Rankings - -|Rank|Submission |Team |Hardware |Status |R@10 | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|---------| -| 1|[-](-) |- |- |-|**-** | -| 2|[-](-) |- |- |-|**-** | -| 3|[-](-) |- |- |-|**-** | -| 4|[-](-) |- |- |-|**-** | -| 5|[-](-) |- |- |-|**-** | -| 6|[-](-) |- |- |-|**-** | - -* The operational point for ranking is 2000 QPS. We will use the highest recall for the search parameters that meet or exceed 2000 QPS. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. 
- -##### MSSpace Throughput Rankings - -|Rank|Submission |Team |Hardware |Status |Q/S | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|------------| -| 1|[-](-) |- |- |-|**-** | -| 2|[-](-) |- |- |-|**-** | -| 3|[-](-) |- |- |-|**-** | -| 4|[-](-) |- |- |-|**-** | -| 5|[-](-) |- |- |-|**-** | -| 6|[-](-) |- |- |-|**-** | - -* The operational point for ranking is 0.9 recall@10. We will use the highest throughput for the search parameters that meet or exceed 0.9 recall@10. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. - -##### MSSpace Power Rankings - -|Rank|Submission |Team |Hardware |Status |W*S/Q | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|------------| -| 1|[-](-) |- |- |-|**-** | -| 2|[-](-) |- |- |-|**-** | -| 3|[-](-) |- |- |-|**-** | -| 4|[-](-) |- |- |-|**-** | -| 5|[-](-) |- |- |-|**-** | -| 6|[-](-) |- |- |-|**-** | - -* The operational point for ranking is 0.9 recall@10. We will use the lowest power consumption for the search parameters that meet or exceed 0.9 recall@10. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. 
- -##### MSSpace Cost Rankings - -|Rank|Submission |Team |Hardware |Status |Cost |capex |opex |unit cost|units@100K qps|KwH*4yrs | -|----|--------------------|------------------------------|-----------------------|------- |--------------|--------|--------|---------|--------------|----------| -| 1|[-](-)|- |- |-|**-** |-|-|- |- |- | -| 2|[-](-)|- |- |-|**-** |-|-|- |- |- | -| 3|[-](-)|- |- |-|**-** |-|-|- |- |- | -| 4|[-](-)|- |- |-|**-** |-|-|- |- |- | -| 5|[-](-)|- |- |-|**-** |-|-|- |- |- | -| 6|[-](-)|- |- |-|**-** |-|-|- |- |- | - -* The operational point for ranking is 0.90 recall@10. We will use the lowest power consumption/query for the search parameters that meet or exceed 0.90 recall@10. -* The formula is based on: - * Take the algorithm's throughput submitted to leaderboard, use it to scale no. of systems needed to scale to 100K qps (using ceiling to round up any decimal.) - * Capex = cost per system * scale no. - * Take w*s/q from algorithm's power metric submitted to leaderboard and convert to KwH/q. - * Multiply by total queries at 100K qps for 4 years = 4x365x24x60x60x100000 total queries over 4 years. - * Opex = (total queries over 4 years) * KwH/query * $0.10/KwH -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. -* \*\*Nvidia has not yet approved the MSRP cost used for ranking, so participation in this benchmark is still pending. 
- -#### Text2Image - -##### Text2Image Recall Rankings - -|Rank|Submission |Team |Hardware |Status |R@10 | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|-------------| -| 1|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |eval|**[0.63732](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/private_text2image-1B_recall.png)** | -| 2|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |eval|**[0.62692](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/private_text2image-1B_recall.png)** | -| 3|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |eval|**[0.61895](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/private_text2image-1B_recall.png)** | -| 4|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |eval|**[0.60105](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/private_text2image-1B_recall.png)** | -| 5|[-](-) |- |- |-|**-** | -| 6|[-](-) |- |- |-|**-** | - -* The operational point for ranking is 2000 QPS. We will use the highest recall for the search parameters that meet or exceed 2000 QPS. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. 
- -##### Text2Image Throughput Rankings - -|Rank|Submission |Team |Hardware |Status |Q/S | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|------------| -| 1|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |eval|**[20,765](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/private_text2image-1B_throughput.png)** | -| 2|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |eval|**[10,364](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/private_text2image-1B_throughput.png)** | -| 3|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |eval|**[2,154](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/private_text2image-1B_throughput.png)** | -| 4|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |eval|**[1,948](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/private_text2image-1B_throughput.png)** | -| 5|[-](-) |- |- |-|**-** | -| 6|[-](-) |- |- |-|**-** | - -* The operational point for ranking is 0.601 recall@10. We will use the highest throughput for the search parameters that meet or exceed 0.601 recall@10. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. 
- -##### Text2Image Power Rankings - -|Rank|Submission |Team |Hardware |Status |W*S/Q | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|-----------| -| 1|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |eval|**[0.0441](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/private_text2image-1B_power.png)**| -| 2|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |eval|**[0.0710](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/private_text2image-1B_power.png)**| -| 3|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |eval|**[0.1091](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/private_text2image-1B_power.png)**| -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |eval|**[0.2661](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/private_text2image-1B_power.png)**| -| 5|[-](-) |- |- |-|**-**| -| 6|[-](-) |- |- |-|**-**| - -* The operational point for ranking is 0.601 recall@10. We will use the lowest power consumption for the search parameters that meet or exceed 0.601 recall@10. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. 
- -##### Text2Image Cost Rankings - -|Rank|Submission |Team |Hardware |Status |Cost |capex |opex |unit cost|units@100K qps|KwH*4yrs | -|----|---------------------|------------------------------|---------------------|--------|--------------|--------|--------|---------|--------------|---------| -| 1|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |eval|**$171,523.05** |$146,642.00|$24,881.05|$14,664.20 |10 |248,810.537| -| 2|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |eval|**$765,461.90\*\*** |$750,000.00|$15,461.90|$150,000.00 |5 |154,619.021| -| 3|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |eval|**$1,183,367.83** |$1,145,138.80|$38,229.03|$22,021.90 |52 |382,290.263| -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |eval|**$2,712,384.33** |$2,619,153.02|$93,231.31|$55,726.66 |47 |932,313.075| -| 5|[-](-) |- |- |-|**-** |-|-|- |- |-| -| 6|[-](-) |- |- |-|**-** |-|-|- |- |-| - -* The operational point for ranking is 0.601 recall@10. We will use the lowest power consumption/query for the search parameters that meet or exceed 0.601 recall@10. -* The formula is based on: - * Take the algorithm's throughput submitted to leaderboard, use it to scale no. of systems needed to scale to 100K qps (using ceiling to round up any decimal.) - * Capex = cost per system * scale no. - * Take w*s/q from algorithm's power metric submitted to leaderboard and convert to KwH/q. - * Multiply by total queries at 100K qps for 4 years = 4x365x24x60x60x100000 total queries over 4 years. 
- * Opex = (total queries over 4 years) * KwH/query * $0.10/KwH -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. -* \*\*Nvidia has not yet approved the MSRP cost used for ranking, so participation in this benchmark is still pending. - -#### FBSimSearchNet - -##### FBSimSearchNet AP Rankings - -|Rank|Submission |Team |Hardware |Status |AP | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|-------------| -| 1|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |eval|**[0.99672](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/private_ssnpp-1B_recall.png)** | -| 2|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |eval|**[0.98567](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/private_ssnpp-1B_recall.png)** | -| 3|[-](-) |- |- |-|**-** | -| 4|[-](-) |- |- |-|**-** | -| 5|[-](-) |- |- |-|**-** | -| 6|[-](-) |- |- |-|**-** | - -* The operational point for ranking is 2000 QPS. We will use the highest recall for the search parameters that meet or exceed 2000 QPS. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. 
- -##### FBSimSearchNet Throughput Rankings - -|Rank|Submission |Team |Hardware |Status |Q/S | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|------------| -| 1|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |eval|**[9,343](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/private_ssnpp-1B_throughput.png)** | -| 2|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |eval|**[6,256](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/private_ssnpp-1B_throughput.png)** | -| 3|[-](-) |- |- |-|**-** | -| 4|[-](-) |- |- |-|**-** | -| 5|[-](-) |- |- |-|**-** | -| 6|[-](-) |- |- |-|**-** | - -* The operational point for ranking is 0.9 average precision. We will use the highest throughput for the search parameters that meet or exceed 0.9 average precision. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking.
- - -##### FBSimSearchNet Power Rankings - -|Rank|Submission |Team |Hardware |Status |W*S/Q | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|-----------| -| 1|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |eval|**[0.0433](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/private_ssnpp-1B_power.png)**| -| 2|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |eval|**[0.0847](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/private_ssnpp-1B_power.png)**| -| 3|[-](-) |- |- |-|**-**| -| 4|[-](-) |- |- |-|**-**| -| 5|[-](-) |- |- |-|**-**| -| 6|[-](-) |- |- |-|**-**| - -* The operational point for ranking is 0.9 average precision. We will use the lowest power consumption for the search parameters that meet or exceed 0.9 average precision. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking.
- -##### FBSimSearchNet Cost Rankings - -|Rank|Submission |Team |Hardware |Status |Cost |capex |opex |unit cost|units@100K qps|KwH*4yrs | -|----|--------------------|------------------------------|---------------------|--------|--------------|--------|--------|---------|--------------|---------| -| 1|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md)|Facebook Research(*org*) |NVidia GPU |eval|**$382,013.99** |$352,350.40|$29,663.59|$22,021.90 |16 |296,635.913| -| 2|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md)|GSI Technology(*org*) |LedaE APU |eval|**$628,176.55** |$612,993.26|$15,183.29|$55,726.66 |11 |151,832.906| -| 3|[-](-)|- |- |-|**-** | -| -| -| -| -| -| 4|[-](-)|- |- |-|**-** | -| -| -| -| -| - -* The operational point for ranking is 0.9 recall@10. We will use the lowest power consumption/query for the search parameters that meet or exceed 0.9 recall@10. -* The formula is based on: - * Take the algorithm's throughput submitted to leaderboard, use it to scale no. of systems needed to scale to 100K qps (using ceiling to round up any decimal.) - * Capex = cost per system * scale no. - * Take w*s/q from algorithm's power metric submitted to leaderboard and convert to KwH/q. - * Multiply by total queries at 100K qps for 4 years = 4x365x24x60x60x100000 total queries over 4 years. - * Opex = (total queries over 4 years) * KwH/query * $0.10/KwH -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. -* \*\*Nvidia has not yet approved the MSRP cost used for ranking, so participation in this benchmark is still pending. 
diff --git a/t3/LEADERBOARDS_PRIVATE_REJECT_ANOMALIES.md b/t3/LEADERBOARDS_PRIVATE_REJECT_ANOMALIES.md deleted file mode 100644 index 45c1130d6..000000000 --- a/t3/LEADERBOARDS_PRIVATE_REJECT_ANOMALIES.md +++ /dev/null @@ -1,566 +0,0 @@ -# T3 Track Private Dataset Leaderboards After Rejecting Anomalies - -Please note that all rankings and winners are unofficial until all [open tasks and issues](TASKS_ISSUES_RESOLUTIONS.md) are resolved. - -## Rankings By Category - -### Rankings By Submission Name (alphabetical) - -|Submission |Team |Hardware |[Recall Rank](#recall-or-ap-rankings)|[Thru-put Rank](#throughput-rankings)|[Power Rank](#power-rankings)|[Cost Rank](#cost-rankings)|Status |Anomalies|Evaluator|Algo |Runs | -|--------------------|-----------|----------|---------|---------|---------|--------|---------|---------|---------|---------|--------| -|[diskann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/diskann-bare-metal/README.md) |Microsoft Research India(*org*) |Dell PowerEdge |*NA* |*NA* |*NA* |*NA* |eval |*NA* |[Harsha Simhadri](https://github.com/harsha-simhadri) |- |- | -|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |[5](#recall-or-ap-rankings) |[5](#throughput-rankings) |[5](#power-rankings) |[4](#cost-rankings) |eval |0/49 |[George Williams](https://github.com/sourcesync) |- |- | -|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |[3](#recall-or-ap-rankings) |[4](#throughput-rankings) |[4](#power-rankings) |[5](#cost-rankings) |eval |0/50 |[George Williams](https://github.com/sourcesync) |- |- | -|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |[1](#recall-or-ap-rankings) |[3](#throughput-rankings) |[1](#power-rankings) |[2](#cost-rankings)\*\* |eval 
|[6/40](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/ANOMALIES.md) |[George Williams](https://github.com/sourcesync) |- |- | -|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |[4](#recall-or-ap-rankings) |[1](#throughput-rankings) |[3](#power-rankings) |[3](#cost-rankings)\*\* |eval |[3/30](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/ANOMALIES.md) |[George Williams](https://github.com/sourcesync) |- |- | -|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md)|Intel |Intel Optane |[2](#recall-or-ap-rankings) |[2](#throughput-rankings) |[2](#power-rankings) |[1](#cost-rankings)|eval |[4/40](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/ANOMALIES.md) |[George Williams](https://github.com/sourcesync) |- |-| - -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. - * *NQ* = not qualified - * *NA* = data is not yet available, or has not yet been processed - -* *Anomalies* are defined as queries that could potentially be the result of query response caching, a violation of the competition. Our detection method looks for a 30% or more improvement in the batch query latency between the first and last query of a query group (5). Participants have been given a chance to explain why detected anomalies (if any) are not a result of query response caching. In general, our analysis did not uncover this symptom of systematic query response caching from any submission. Also, if we throw out the anomalous data points, the adjusted leaderboard rankings (above) do not change even though some scores change slightly. 
- -* \*\*Nvidia has not yet approved the MSRP cost used for ranking, so participation in this benchmark is still pending. - -### Rankings Per Benchmark - -#### Recall Or AP Rankings - -|Rank|Submission |Team |Hardware|Status |Score |[Deep1B](#deep1B-recall-rankings)|[BigANN](#bigann-recall-rankings)|[MSTuring](#msturing-recall-rankings)|[MSSpace](#msspace-recall-rankings)|[Text2Image](#text2image-recall-rankings)|[FBSSNet](#fbsimsearchnet-ap-rankings)| -|----|------------------|-------|--------|-------|-----------|------|------|--------|-------|----------|-------| -| 1|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md)|NVidia|NVidia GPU |eval|**0.225**|0.99541 |0.99882 |0.99054 |- |0.63732 |- | -| 2|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md)|Intel|Intel Optane |eval|**0.224**|0.99872 |0.99977 |0.99561 |- |0.62692 |- | -| 3|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md)|GSI Technology(*org*)|LedaE APU |eval|**0.197**|0.99185 |0.99452 |0.97719 |- |0.61895 |0.99672 | -| 4|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md)|NVidia|NVidia GPU |eval|**0.094**|0.95788 |0.96978 |0.96186 |- |- |- | -| 5|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md)|Facebook Research(*org*)|NVidia GPU |eval|**baseline**|0.94437 |0.93604 |0.91513 |- |0.60105 |0.98567 | -| 6|[-](-)|-|- |-|**-**|- |- |- |- |- |- | - -* A submission must support at least 3 databases to qualify for this ranking. -* The ranking is based on the score, which is the sum of benchmark improvements of qualifying databases (shown in specific database columns after the score column.) 
-* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. - -#### Throughput Rankings - -|Rank|Submission |Team |Hardware|Status |Score |[Deep1B](#deep1B-throughput-rankings)|[BigANN](#bigann-throughput-rankings)|[MSTuring](#msturing-throughput-rankings)|[MSSpace](#msspace-throughput-rankings)|[Text2Image](#text2image-throughput-rankings)|[FBSSNet](#fbsimsearchnet-throughput-rankings)| -|----|------------------|-------|--------|-------|-----------|------|------|--------|-------|----------|--------------| -| 1|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md)|NVidia|NVidia GPU |eval|**2116124**|968,840 |764,700 |393,528 |- |- |- | -| 2|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md)|Intel|Intel Optane |eval|**685763**|210,403 |350,007 |127,883 |- |10,364 |- | -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md)|NVidia|NVidia GPU |eval|**297608**|94,042 |84,806 |110,886 |- |20,765 |- | -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md)|GSI Technology(*org*)|LedaE APU |eval|**30425**|12,345 |10,868 |14,862 |- |2,154 |9,343 | -| 5|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md)|Facebook Research(*org*)|NVidia GPU |eval|**baseline**|5,035 |3,279 |2,630 |- |1,948 |6,256 | -| 6|[-](-)|-|- |-|**-**|- |- |- |- |- |- | - -* A submission must support at least 3 databases to qualify for this ranking. -* The ranking is based on the score, which is the sum of benchmark improvements of qualifying databases (shown in specific database columns after the score column.) 
-* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. - -#### Power Rankings - -|Rank|Submission |Team |Hardware|Status |Score |[Deep1B](#deep1B-power-rankings)|[BigANN](#bigann-power-rankings)|[MSTuring](#msturing-power-rankings)|[MSSpace](#msspace-power-rankings)|[Text2Image](#text2image-power-rankings)|[FBSSNet](#fbsimsearchnet-power-rankings)| -|----|------------------|-------|--------|-------|-----------|------|------|--------|-------|-----|-----| -| 1|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md)|NVidia|NVidia GPU |eval|**-0.475**|0.0104 |0.0119 |0.0099 |- |0.0441|-| -| 2|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md)|Intel|Intel Optane |eval|**-0.469**|0.0036 |0.0020 |0.0054 |- |0.0710|-| -| 3|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md)|NVidia|NVidia GPU |eval|**-0.431**|0.0025 |0.0022 |0.0061 |- |-|-| -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md)|GSI Technology(*org*)|LedaE APU |eval|**-0.232**|0.0352 |0.0342 |0.0250 |- |0.2661|0.0433| -| 5|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md)|Facebook Research(*org*)|NVidia GPU |eval|**baseline**|0.0923 |0.1623 |0.1874 |- |0.1091|0.0847| -| 6|[-](-)|-|- |-|**-**|- |- |- |- |-|-| - -* A submission must support at least 3 databases to qualify for this ranking. -* The ranking is based on the score, which is the sum of benchmark improvements of qualifying databases (shown in specific database columns after the score column.) 
-* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. - -#### Cost Rankings - -|Rank|Submission |Team |Hardware|Status |Score |[Deep1B](#deep1B-cost-rankings)|[BigANN](#bigann-cost-rankings)|[MSTuring](#msturing-cost-rankings)|[MSSpace](#msspace-cost-rankings)|[Text2Image](#text2image-cost-rankings)|[FBSSNet](#fbsimsearchnet-cost-rankings)| -|----|------------------|-------|--------|-------|-----------|------|------|--------|-------|----------|--------------| -| 1|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md)|Intel|Intel Optane |eval|**$-3,100,829.55**|$15,918.69 |$15,372.40 |$16,572.66 |- |$171,523.05 |- | -| 2|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md)|NVidia|NVidia GPU |eval|**$-1,793,445.89\*\***|$303,647.91 |$304,177.20 |$153,483.45 |- |$765,461.90 |- | -| 3|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md)|NVidia|NVidia GPU |eval|**$-1,683,055.85\*\***|$150,863.29 |$150,786.43 |$152,142.96 |- |- |- | -| 4|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md)|Facebook Research(*org*)|NVidia GPU |eval|**baseline**|$472,764.09 |$739,552.84 |$924,531.60 |- |$1,183,367.83 |$382,013.99 | -| 5|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md)|GSI Technology(*org*)|LedaE APU |eval|**$1,120,285.77**|$513,869.50 |$569,253.60 |$398,832.13 |- |$2,712,384.33 |$628,176.55 | -| 6|[-](-)|-|- |-|**-**|- |- |- |- |- |- | - -* A submission must support at least 3 databases to qualify for this ranking. 
-* The ranking is based on the score, which is the sum of benchmark improvements of qualifying databases (shown in specific database columns after the score column.) -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. - -* \*\*Nvidia has not yet approved the MSRP cost used for ranking, so participation in this benchmark is still pending. - -### Rankings Per Database - -#### Deep1B - -##### Deep1B Recall Rankings - -|Rank|Submission |Team |Hardware |Status |R@10 | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|-----------| -| 1|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |eval|**0.99872**| -| 2|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |eval|**0.99541**| -| 3|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |eval|**0.99185**| -| 4|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |eval|**0.95788**| -| 5|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |eval|**0.94437**| -| 6|[-](-) |- |- |-|**-**| - -* The operational point for ranking is 2000 QPS. We will use the highest recall for the search parameters that meet or exceed 2000 QPS. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. 
- -##### Deep1B Throughput Rankings - -|Rank|Submission |Team |Hardware |Status |Q/S | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|-----------| -| 1|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |eval|**968,840**| -| 2|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |eval|**210,403**| -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |eval|**94,042**| -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |eval|**12,345**| -| 5|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |eval|**5,035**| -| 6|[-](-) |- |- |-|**-**| - -* The operational point for ranking is 0.90 recall@10. We will use the highest throughput for the search parameters that meet or exceed 0.90 recall@10. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. 
- -##### Deep1B Power Rankings - -|Rank|Submission |Team |Hardware |Status |W*S/Q | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|-----------| -| 1|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |eval|**0.0025**| -| 2|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |eval|**0.0036**| -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |eval|**0.0104**| -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |eval|**0.0352**| -| 5|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |eval|**0.0923**| -| 6|[-](-) |- |- |-|**-**| - -* The operational point for ranking is 0.90 recall@10. We will use the lowest power consumption for the search parameters that meet or exceed 0.90 recall@10. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. 
- -##### Deep1B Cost Rankings - -|Rank|Submission |Team |Hardware |Status |Cost |capex |opex |unit cost|units@100K qps|KwH*4yrs | -|----|--------------------|---------|-----------------------|--------|-------------|--------|--------|---------|--------------|---------| -| 1|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md)|Intel |Intel Optane |eval|**$15,918.69** |$14,664.20|$1,254.49|$14,664.20 |1 |12,544.902| -| 2|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md)|NVidia |NVidia GPU |eval|**$150,863.29\*\*** |$150,000.00|$863.29|$150,000.00 |1 |8,632.870| -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md)|NVidia |NVidia GPU |eval|**$303,647.91\*\*** |$300,000.00|$3,647.91|$150,000.00 |2 |36,479.145| -| 4|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md)|Facebook Research(*org*) |NVidia GPU |eval|**$472,764.09** |$440,438.00|$32,326.09|$22,021.90 |20 |323,260.873| -| 5|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md)|GSI Technology(*org*) |LedaE APU |eval|**$513,869.50** |$501,539.94|$12,329.56|$55,726.66 |9 |123,295.635| -| 6|[-](-)|- |- |-|**-** |-|-|- |- |-| - -* The operational point for ranking is 0.90 recall@10. We will use the lowest power consumption/query for the search parameters that meet or exceed 0.90 recall@10. -* The formula is based on: - * Take the algorithm's throughput submitted to leaderboard, use it to scale no. of systems needed to scale to 100K qps (using ceiling to round up any decimal.) - * Capex = cost per system * scale no. - * Take w*s/q from algorithm's power metric submitted to leaderboard and convert to KwH/q. 
- * Multiply by total queries at 100K qps for 4 years = 4x365x24x60x60x100000 total queries over 4 years. - * Opex = (total queries over 4 years) * KwH/query * $0.10/KwH -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. -* \*\*Nvidia has not yet approved the MSRP cost used for ranking, so participation in this benchmark is still pending. - -#### BigANN - -##### BigANN Recall Rankings - -|Rank|Submission |Team |Hardware |Status |R@10 | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|-------------| -| 1|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |eval|**0.99977** | -| 2|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |eval|**0.99882** | -| 3|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |eval|**0.99452** | -| 4|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |eval|**0.96978** | -| 5|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |eval|**0.93604** | -| 6|[-](-) |- |- |-|**-** | - -* The operational point for ranking is 2000 QPS. We will use the highest recall for the search parameters that meet or exceed 2000 QPS. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. 
- -##### BigANN Throughput Rankings - -|Rank|Submission |Team |Hardware |Status |Q/S | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|-------------| -| 1|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |eval|**764,700** | -| 2|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |eval|**350,007** | -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |eval|**84,806** | -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |eval|**10,868** | -| 5|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |eval|**3,279** | -| 6|[-](-) |- |- |-|**-** | - -* The operational point for ranking is 0.90 recall@10. We will use the highest throughput for the search parameters that meet or exceed 0.90 recall@10. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. 
- -##### BigANN Power Rankings - -|Rank|Submission |Team |Hardware |Status |W*S/Q | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|-----------| -| 1|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |eval|**0.0020**| -| 2|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |eval|**0.0022**| -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |eval|**0.0119**| -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |eval|**0.0342**| -| 5|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |eval|**0.1623**| -| 6|[-](-) |- |- |-|**-**| - -* The operational point for ranking is 0.90 recall@10. We will use the lowest power consumption for the search parameters that meet or exceed 0.90 recall@10. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. 
- -##### BigANN Cost Rankings - -|Rank|Submission |Team |Hardware |Status |Cost |capex |opex |unit cost|units@100K qps|KwH*4yrs | -|----|--------------------|------------------------------|--------------------|--------|--------------|--------|--------|---------|--------------|---------| -| 1|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md)|Intel |Intel Optane |eval|**$15,372.40** |$14,664.20|$708.20|$14,664.20 |1 |7,082.016| -| 2|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md)|NVidia |NVidia GPU |eval|**$150,786.43\*\*** |$150,000.00|$786.43|$150,000.00 |1 |7,864.254| -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md)|NVidia |NVidia GPU |eval|**$304,177.20\*\*** |$300,000.00|$4,177.20|$150,000.00 |2 |41,771.962| -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md)|GSI Technology(*org*) |LedaE APU |eval|**$569,253.60** |$557,266.60|$11,987.00|$55,726.66 |10 |119,870.019| -| 5|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md)|Facebook Research(*org*) |NVidia GPU |eval|**$739,552.84** |$682,678.90|$56,873.94|$22,021.90 |31 |568,739.415| -| 6|[-](-)|- |- |-|**-** |-|-|- |- |-| - -* The operational point for ranking is 0.90 recall@10. We will use the lowest power consumption/query for the search parameters that meet or exceed 0.90 recall@10. -* The formula is based on: - * Take the algorithm's throughput submitted to leaderboard, use it to scale no. of systems needed to scale to 100K qps (using ceiling to round up any decimal.) - * Capex = cost per system * scale no. - * Take w*s/q from algorithm's power metric submitted to leaderboard and convert to KwH/q. - * Multiply by total queries at 100K qps for 4 years = 4x365x24x60x60x100000 total queries over 4 years. 
- * Opex = (total queries over 4 years) * KwH/query * $0.10/KwH -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. -* \*\*Nvidia has not yet approved the MSRP cost used for ranking, so participation in this benchmark is still pending. - -#### MSTuring - -##### MSTuring Recall Rankings - -|Rank|Submission |Team |Hardware |Status |R@10 | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|---------------| -| 1|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |eval|**0.99561** | -| 2|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |eval|**0.99054** | -| 3|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |eval|**0.97719** | -| 4|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |eval|**0.96186** | -| 5|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |eval|**0.91513** | -| 6|[-](-) |- |- |-|**-** | - -* The operational point for ranking is 2000 QPS. We will use the highest recall for the search parameters that meet or exceed 2000 QPS. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. 
- -##### MSTuring Throughput Rankings - -|Rank|Submission |Team |Hardware |Status |Q/S | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|------------| -| 1|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |eval|**393,528** | -| 2|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |eval|**127,883** | -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |eval|**110,886** | -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |eval|**14,862** | -| 5|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |eval|**2,630** | -| 6|[-](-) |- |- |-|**-** | - -* The operational point for ranking is 0.90 recall@10. We will use the highest throughput for the search parameters that meet or exceed 0.90 recall@10. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. 
- -##### MSTuring Power Rankings - -|Rank|Submission |Team |Hardware |Status|W*S/Q | -|----|-------------------------------------------------------|------------------------------|-----------------------|------|--------------| -| 1|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |eval|**0.0054** | -| 2|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |eval|**0.0061** | -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |eval|**0.0099** | -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |eval|**0.0250** | -| 5|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |eval|**0.1874** | -| 6|[-](-) |- |- |-|**-** | - -* The operational point for ranking is 0.90 recall@10. We will use the lowest power consumption for the search parameters that meet or exceed 0.90 recall@10. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. 
- -##### MSTuring Cost Rankings - -|Rank|Submission |Team |Hardware |Status |Cost |capex |opex |unit cost|units@100K qps|KwH*4yrs | -|----|------------------------------------|------------------------------|-----------------------|--------|--------------|--------|--------|---------|--------------|----------| -| 1|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |eval|**$16,572.66** |$14,664.20|$1,908.46|$14,664.20 |1 |19,084.644 | -| 2|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |eval|**$152,142.96\*\*** |$150,000.00|$2,142.96|$150,000.00 |1 |21,429.628 | -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |eval|**$153,483.45\*\*** |$150,000.00|$3,483.45|$150,000.00 |1 |34,834.523 | -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |eval|**$398,832.13** |$390,086.62|$8,745.51|$55,726.66 |7 |87,455.147 | -| 5|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |eval|**$924,531.60** |$858,854.10|$65,677.50|$22,021.90 |39 |656,775.000 | -| 6|[-](-) |- |- |-|**-** |-|-|- |- |- | - -* The operational point for ranking is 0.90 recall@10. We will use the lowest power consumption/query for the search parameters that meet or exceed 0.90 recall@10. -* The formula is based on: - * Take the algorithm's throughput submitted to leaderboard, use it to scale no. of systems needed to scale to 100K qps (using ceiling to round up any decimal.) - * Capex = cost per system * scale no. - * Take w*s/q from algorithm's power metric submitted to leaderboard and convert to KwH/q. 
- * Multiply by total queries at 100K qps for 4 years = 4x365x24x60x60x100000 total queries over 4 years. - * Opex = (total queries over 4 years) * KwH/query * $0.10/KwH -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. -* \*\*Nvidia has not yet approved the MSRP cost used for ranking, so participation in this benchmark is still pending. - -#### MSSpace - -##### MSSpace Recall Rankings - -|Rank|Submission |Team |Hardware |Status |R@10 | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|---------| -| 1|[-](-) |- |- |-|**-** | -| 2|[-](-) |- |- |-|**-** | -| 3|[-](-) |- |- |-|**-** | -| 4|[-](-) |- |- |-|**-** | -| 5|[-](-) |- |- |-|**-** | -| 6|[-](-) |- |- |-|**-** | - -* The operational point for ranking is 2000 QPS. We will use the highest recall for the search parameters that meet or exceed 2000 QPS. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. - -##### MSSpace Throughput Rankings - -|Rank|Submission |Team |Hardware |Status |Q/S | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|------------| -| 1|[-](-) |- |- |-|**-** | -| 2|[-](-) |- |- |-|**-** | -| 3|[-](-) |- |- |-|**-** | -| 4|[-](-) |- |- |-|**-** | -| 5|[-](-) |- |- |-|**-** | -| 6|[-](-) |- |- |-|**-** | - -* The operational point for ranking is 0.9 recall@10. We will use the highest throughput for the search parameters that meet or exceed 0.9 recall@10. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. 
- * *final* = final submission and ranking. - -##### MSSpace Power Rankings - -|Rank|Submission |Team |Hardware |Status |W*S/Q | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|------------| -| 1|[-](-) |- |- |-|**-** | -| 2|[-](-) |- |- |-|**-** | -| 3|[-](-) |- |- |-|**-** | -| 4|[-](-) |- |- |-|**-** | -| 5|[-](-) |- |- |-|**-** | -| 6|[-](-) |- |- |-|**-** | - -* The operational point for ranking is 0.9 recall@10. We will use the lowest power consumption for the search parameters that meet or exceed 0.9 recall@10. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. - -##### MSSpace Cost Rankings - -|Rank|Submission |Team |Hardware |Status |Cost |capex |opex |unit cost|units@100K qps|KwH*4yrs | -|----|--------------------|------------------------------|-----------------------|------- |--------------|--------|--------|---------|--------------|----------| -| 1|[-](-)|- |- |-|**-** |-|-|- |- |- | -| 2|[-](-)|- |- |-|**-** |-|-|- |- |- | -| 3|[-](-)|- |- |-|**-** |-|-|- |- |- | -| 4|[-](-)|- |- |-|**-** |-|-|- |- |- | -| 5|[-](-)|- |- |-|**-** |-|-|- |- |- | -| 6|[-](-)|- |- |-|**-** |-|-|- |- |- | - -* The operational point for ranking is 0.90 recall@10. We will use the lowest power consumption/query for the search parameters that meet or exceed 0.90 recall@10. -* The formula is based on: - * Take the algorithm's throughput submitted to leaderboard, use it to scale no. of systems needed to scale to 100K qps (using ceiling to round up any decimal.) - * Capex = cost per system * scale no. - * Take w*s/q from algorithm's power metric submitted to leaderboard and convert to KwH/q. - * Multiply by total queries at 100K qps for 4 years = 4x365x24x60x60x100000 total queries over 4 years. 
- * Opex = (total queries over 4 years) * KwH/query * $0.10/KwH -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. -* \*\*Nvidia has not yet approved the MSRP cost used for ranking, so participation in this benchmark is still pending. - -#### Text2Image - -##### Text2Image Recall Rankings - -|Rank|Submission |Team |Hardware |Status |R@10 | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|-------------| -| 1|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |eval|**0.63732** | -| 2|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |eval|**0.62692** | -| 3|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |eval|**0.61895** | -| 4|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |eval|**0.60105** | -| 5|[-](-) |- |- |-|**-** | -| 6|[-](-) |- |- |-|**-** | - -* The operational point for ranking is 2000 QPS. We will use the highest recall for the search parameters that meet or exceed 2000 QPS. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. 
- -##### Text2Image Throughput Rankings - -|Rank|Submission |Team |Hardware |Status |Q/S | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|------------| -| 1|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |eval|**20,765** | -| 2|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |eval|**10,364** | -| 3|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |eval|**2,154** | -| 4|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |eval|**1,948** | -| 5|[-](-) |- |- |-|**-** | -| 6|[-](-) |- |- |-|**-** | - -* The operational point for ranking is 0.601 recall@10. We will use the highest throughput for the search parameters that meet or exceed 0.601 recall@10. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. 
- -##### Text2Image Power Rankings - -|Rank|Submission |Team |Hardware |Status |W*S/Q | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|-----------| -| 1|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |eval|**0.0441**| -| 2|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |eval|**0.0710**| -| 3|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |eval|**0.1091**| -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |eval|**0.2661**| -| 5|[-](-) |- |- |-|**-**| -| 6|[-](-) |- |- |-|**-**| - -* The operational point for ranking is 0.601 recall@10. We will use the lowest power consumption for the search parameters that meet or exceed 0.601 recall@10. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. 
- -##### Text2Image Cost Rankings - -|Rank|Submission |Team |Hardware |Status |Cost |capex |opex |unit cost|units@100K qps|KwH*4yrs | -|----|---------------------|------------------------------|---------------------|--------|--------------|--------|--------|---------|--------------|---------| -| 1|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |eval|**$171,523.05** |$146,642.00|$24,881.05|$14,664.20 |10 |248,810.537| -| 2|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |eval|**$765,461.90\*\*** |$750,000.00|$15,461.90|$150,000.00 |5 |154,619.021| -| 3|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |eval|**$1,183,367.83** |$1,145,138.80|$38,229.03|$22,021.90 |52 |382,290.263| -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |eval|**$2,712,384.33** |$2,619,153.02|$93,231.31|$55,726.66 |47 |932,313.075| -| 5|[-](-) |- |- |-|**-** |-|-|- |- |-| -| 6|[-](-) |- |- |-|**-** |-|-|- |- |-| - -* The operational point for ranking is 0.601 recall@10. We will use the lowest power consumption/query for the search parameters that meet or exceed 0.601 recall@10. -* The formula is based on: - * Take the algorithm's throughput submitted to leaderboard, use it to scale no. of systems needed to scale to 100K qps (using ceiling to round up any decimal.) - * Capex = cost per system * scale no. - * Take w*s/q from algorithm's power metric submitted to leaderboard and convert to KwH/q. - * Multiply by total queries at 100K qps for 4 years = 4x365x24x60x60x100000 total queries over 4 years. 
- * Opex = (total queries over 4 years) * KwH/query * $0.10/KwH -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. -* \*\*Nvidia has not yet approved the MSRP cost used for ranking, so participation in this benchmark is still pending. - -#### FBSimSearchNet - -##### FBSimSearchNet AP Rankings - -|Rank|Submission |Team |Hardware |Status |AP | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|-------------| -| 1|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |eval|**0.99672** | -| 2|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |eval|**0.98567** | -| 3|[-](-) |- |- |-|**-** | -| 4|[-](-) |- |- |-|**-** | -| 5|[-](-) |- |- |-|**-** | -| 6|[-](-) |- |- |-|**-** | - -* The operational point for ranking is 2000 QPS. We will use the highest recall for the search parameters that meet or exceed 2000 QPS. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. 
- -##### FBSimSearchNet Throughput Rankings - -|Rank|Submission |Team |Hardware |Status |Q/S | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|------------| -| 1|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |eval|**9,343** | -| 2|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |eval|**6,256** | -| 3|[-](-) |- |- |-|**-** | -| 4|[-](-) |- |- |-|**-** | -| 5|[-](-) |- |- |-|**-** | -| 6|[-](-) |- |- |-|**-** | - -* The operational point for ranking is 0.9 recall@10. We will use the highest throughput for the search parameters that meet or exceed 0.9 average precision. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. - - -##### FBSimSearchNet Power Rankings - -|Rank|Submission |Team |Hardware |Status |W*S/Q | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|-----------| -| 1|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |eval|**0.0433**| -| 2|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |eval|**0.0847**| -| 3|[-](-) |- |- |-|**-**| -| 4|[-](-) |- |- |-|**-**| -| 5|[-](-) |- |- |-|**-**| -| 6|[-](-) |- |- |-|**-**| - -* The operational point for ranking is 0.9 recall@10. We will use the lowest power consumption for the search parameters that meet or exceed 0.9 average precision. 
-* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. - -##### FBSimSearchNet Cost Rankings - -|Rank|Submission |Team |Hardware |Status |Cost |capex |opex |unit cost|units@100K qps|KwH*4yrs | -|----|--------------------|------------------------------|---------------------|--------|--------------|--------|--------|---------|--------------|---------| -| 1|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md)|Facebook Research(*org*) |NVidia GPU |eval|**$382,013.99** |$352,350.40|$29,663.59|$22,021.90 |16 |296,635.913| -| 2|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md)|GSI Technology(*org*) |LedaE APU |eval|**$628,176.55** |$612,993.26|$15,183.29|$55,726.66 |11 |151,832.906| -| 3|[-](-)|- |- |-|**-** | -| -| -| -| -| -| 4|[-](-)|- |- |-|**-** | -| -| -| -| -| - -* The operational point for ranking is 0.9 recall@10. We will use the lowest power consumption/query for the search parameters that meet or exceed 0.9 recall@10. -* The formula is based on: - * Take the algorithm's throughput submitted to leaderboard, use it to scale no. of systems needed to scale to 100K qps (using ceiling to round up any decimal.) - * Capex = cost per system * scale no. - * Take w*s/q from algorithm's power metric submitted to leaderboard and convert to KwH/q. - * Multiply by total queries at 100K qps for 4 years = 4x365x24x60x60x100000 total queries over 4 years. - * Opex = (total queries over 4 years) * KwH/query * $0.10/KwH -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. 
-* \*\*Nvidia has not yet approved the MSRP cost used for ranking, so participation in this benchmark is still pending. diff --git a/t3/LEADERBOARDS_PUBLIC.md b/t3/LEADERBOARDS_PUBLIC.md deleted file mode 100644 index ecc07019f..000000000 --- a/t3/LEADERBOARDS_PUBLIC.md +++ /dev/null @@ -1,566 +0,0 @@ -# T3 Track Public Dataset Leaderboards - -Please note that all rankings and winners are unofficial until all [open tasks and issues](TASKS_ISSUES_RESOLUTIONS.md) are resolved. - -## Rankings By Category - -### Rankings By Submission Name (alphabetical) - -|Submission |Team |Hardware |[Recall Rank](#recall-or-ap-rankings)|[Thru-put Rank](#throughput-rankings)|[Power Rank](#power-rankings)|[Cost Rank](#cost-rankings)|Status |Anomalies|Evaluator|Algo |Runs | -|--------------------|-----------|----------|---------|---------|---------|--------|---------|---------|---------|---------|--------| -|[diskann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/diskann-bare-metal/README.md) |Microsoft Research India(*org*) |Dell PowerEdge |[1](#recall-or-ap-rankings) |[5](#throughput-rankings) |*NQ* |*NQ* |final |*NA* |[Harsha Simhadri](https://github.com/harsha-simhadri) |[src](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/benchmark/algorithms/diskann-t2.py) |[nb](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/EvalPublic.ipynb) | -|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |[6](#recall-or-ap-rankings) |[6](#throughput-rankings) |[5](#power-rankings) |[5](#cost-rankings) |final |0/58 |[George Williams](https://github.com/sourcesync) |[src](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/benchmark/algorithms/faiss_t3.py) |[nb](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/EvalPublic.ipynb) | 
-|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |[4](#recall-or-ap-rankings) |[4](#throughput-rankings) |[4](#power-rankings) |[4](#cost-rankings) |final |0/60 |[George Williams](https://github.com/sourcesync) |[src](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/benchmark/algorithms/gemini.py) |[nb](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/EvalPublic.ipynb) | -|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |[3](#recall-or-ap-rankings) |[3](#throughput-rankings) |[2](#power-rankings) |[2](#cost-rankings)\*\* |final |[6/50](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/ANOMALIES.md) |[George Williams](https://github.com/sourcesync) |[src](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/benchmark/algorithms/cuanns_ivfpq.py) |[nb](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/EvalPublic.ipynb) | -|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |[5](#recall-or-ap-rankings) |[1](#throughput-rankings) |[3](#power-rankings) |[3](#cost-rankings)\*\* |final |[4/40](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/ANOMALIES.md) |[George Williams](https://github.com/sourcesync) |[src](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/benchmark/algorithms/cuanns_multigpu.py) |[nb](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/EvalPublic.ipynb) | -|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md)|Intel |Intel Optane |[2](#recall-or-ap-rankings) |[2](#throughput-rankings) |[1](#power-rankings) 
|[1](#cost-rankings)|final |[5/50](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/ANOMALIES.md) |[George Williams](https://github.com/sourcesync) |[src](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/benchmark/algorithms/graphann.py) |[nb](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/EvalPublic.ipynb)| - -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. - * *NQ* = not qualified - * *NA* = data is not yet available, or has not yet been processed - -* *Anomalies* are defined as queries that could potentially be the result of query response caching, a violation of the competition. Our detection method looks for a 30% or more improvement in the batch query latency between the first and last query of a query group (5). Participants have been given a chance to explain why detected anomalies (if any) are not a result of query response caching. In general, our analysis did not uncover this symptom of systematic query response caching from any submission. Also, if we throw out the anomalous data points, the [adjusted leaderboard rankings](LEADERBOARDS_PUBLIC_REJECT_ANOMALIES.md) do not change even though some scores change slightly. - -* \*\*Nvidia has not yet approved the MSRP cost used for ranking, so participation in this benchmark is still pending. 
- -### Rankings Per Benchmark - -#### Recall Or AP Rankings - -|Rank|Submission |Team |Hardware|Status |Score |[Deep1B](#deep1B-recall-rankings)|[BigANN](#bigann-recall-rankings)|[MSTuring](#msturing-recall-rankings)|[MSSpace](#msspace-recall-rankings)|[Text2Image](#text2image-recall-rankings)|[FBSSNet](#fbsimsearchnet-ap-rankings)| -|----|------------------|-------|--------|-------|-----------|------|------|--------|-------|----------|-------| -| 1|[diskann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/diskann-bare-metal/README.md)|Microsoft Research India(*org*)|Dell PowerEdge |final|**0.410**|[0.99821](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/deep-1B_recall.png) |[0.99976](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/bigann-1B_recall.png) |[0.99444](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/msturing-1B_recall.png) |[0.99342](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/msspacev-1B_recall.png) |[0.98130](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/text2image-1B_recall.png) |- | -| 2|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md)|Intel|Intel Optane |final|**0.409**|[0.99882](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/deep-1B_recall.png) |[0.99978](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/bigann-1B_recall.png) |[0.99568](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/msturing-1B_recall.png) |[0.99835](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/msspacev-1B_recall.png) 
|[0.97340](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/text2image-1B_recall.png) |- | -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md)|NVidia|NVidia GPU |final|**0.368**|[0.99543](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/deep-1B_recall.png) |[0.99881](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/bigann-1B_recall.png) |[0.98993](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/msturing-1B_recall.png) |[0.99429](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/msspacev-1B_recall.png) |[0.94692](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/text2image-1B_recall.png) |- | -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md)|GSI Technology(*org*)|LedaE APU |final|**0.339**|[0.99208](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/deep-1B_recall.png) |[0.99328](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/bigann-1B_recall.png) |[0.97841](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/msturing-1B_recall.png) |[0.98622](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/msspacev-1B_recall.png) |[0.92855](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/text2image-1B_recall.png) |[0.99684](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/ssnpp-1B_recall.png) | -| 5|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md)|NVidia|NVidia GPU 
|final|**0.268**|[0.99504](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/deep-1B_recall.png) |[0.99815](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/bigann-1B_recall.png) |[0.98399](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/msturing-1B_recall.png) |[0.98785](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/msspacev-1B_recall.png) |- |- | -| 6|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md)|Facebook Research(*org*)|NVidia GPU |final|**baseline**|[0.94275](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/deep-1B_recall.png) |[0.93260](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/bigann-1B_recall.png) |[0.91322](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/msturing-1B_recall.png) |[0.90853](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/msspacev-1B_recall.png) |[0.86028](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/text2image-1B_recall.png) |[0.97863](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/ssnpp-1B_recall.png) | - -* A submission must support at least 3 databases to qualify for this ranking. -* The ranking is based on the score, which is the sum of benchmark improvements of qualifying databases (shown in specific database columns after the score column.) -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. 
- -#### Throughput Rankings - -|Rank|Submission |Team |Hardware|Status |Score |[Deep1B](#deep1B-throughput-rankings)|[BigANN](#bigann-throughput-rankings)|[MSTuring](#msturing-throughput-rankings)|[MSSpace](#msspace-throughput-rankings)|[Text2Image](#text2image-throughput-rankings)|[FBSSNet](#fbsimsearchnet-throughput-rankings)| -|----|------------------|-------|--------|-------|-----------|------|------|--------|-------|----------|--------------| -| 1|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md)|NVidia|NVidia GPU |final|**2959313**|[801,694](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/deep-1B_throughput.png) |[747,421](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/bigann-1B_throughput.png) |[584,293](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/msturing-1B_throughput.png) |[839,749](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/msspacev-1B_throughput.png) |- |- | -| 2|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md)|Intel|Intel Optane |final|**853257**|[196,546](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/deep-1B_throughput.png) |[335,991](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/bigann-1B_throughput.png) |[161,463](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/msturing-1B_throughput.png) |[157,828](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/msspacev-1B_throughput.png) |[17,063](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/text2image-1B_throughput.png) |- | -| 
3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md)|NVidia|NVidia GPU |final|**393318**|[91,701](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/deep-1B_throughput.png) |[80,109](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/bigann-1B_throughput.png) |[109,745](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/msturing-1B_throughput.png) |[108,302](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/msspacev-1B_throughput.png) |[19,094](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/text2image-1B_throughput.png) |- | -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md)|GSI Technology(*org*)|LedaE APU |final|**52429**|[10,704](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/deep-1B_throughput.png) |[10,672](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/bigann-1B_throughput.png) |[21,780](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/msturing-1B_throughput.png) |[16,422](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/msspacev-1B_throughput.png) |[4,838](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/text2image-1B_throughput.png) |[9,345](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/ssnpp-1B_throughput.png) | -| 5|[diskann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/diskann-bare-metal/README.md)|Microsoft Research India(*org*)|Dell PowerEdge |final|**49398**|[12,927](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/deep-1B_throughput.png) 
|[19,094](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/bigann-1B_throughput.png) |[17,201](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/msturing-1B_throughput.png) |[6,503](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/msspacev-1B_throughput.png) |[9,307](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/text2image-1B_throughput.png) |- | -| 6|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md)|Facebook Research(*org*)|NVidia GPU |final|**baseline**|[4,464](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/deep-1B_throughput.png) |[3,271](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/bigann-1B_throughput.png) |[2,845](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/msturing-1B_throughput.png) |[3,265](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/msspacev-1B_throughput.png) |[1,789](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/text2image-1B_throughput.png) |[5,699](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/ssnpp-1B_throughput.png) | - -* A submission must support at least 3 databases to qualify for this ranking. -* The ranking is based on the score, which is the sum of benchmark improvements of qualifying databases (shown in specific database columns after the score column.) -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. 
- -#### Power Rankings - -|Rank|Submission |Team |Hardware|Status |Score |[Deep1B](#deep1B-power-rankings)|[BigANN](#bigann-power-rankings)|[MSTuring](#msturing-power-rankings)|[MSSpace](#msspace-power-rankings)|[Text2Image](#text2image-power-rankings)|[FBSSNet](#fbsimsearchnet-power-rankings)| -|----|------------------|-------|--------|-------|-----------|------|------|--------|-------|-----|-----| -| 1|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md)|Intel|Intel Optane |final|**-0.648**|[0.0041](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/deep-1B_power.png) |[0.0022](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/bigann-1B_power.png) |[0.0048](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/msturing-1B_power.png) |[0.0049](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/msspacev-1B_power.png) |[0.0446](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/text2image-1B_power.png)|-| -| 2|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md)|NVidia|NVidia GPU |final|**-0.619**|[0.0112](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/deep-1B_power.png) |[0.0119](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/bigann-1B_power.png) |[0.0090](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/msturing-1B_power.png) |[0.0090](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/msspacev-1B_power.png) |[0.0480](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/text2image-1B_power.png)|-| -| 
3|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md)|NVidia|NVidia GPU |final|**-0.583**|[0.0029](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/deep-1B_power.png) |[0.0024](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/bigann-1B_power.png) |[0.0049](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/msturing-1B_power.png) |[0.0023](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/msspacev-1B_power.png) |-|-| -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md)|GSI Technology(*org*)|LedaE APU |final|**-0.513**|[0.0337](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/deep-1B_power.png) |[0.0341](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/bigann-1B_power.png) |[0.0236](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/msturing-1B_power.png) |[0.0230](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/msspacev-1B_power.png) |[0.1242](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/text2image-1B_power.png)|[0.0469](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/ssnpp-1B_power.png)| -| 5|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/diskann-bare-metal/README.md)|Facebook Research(*org*)|NVidia GPU |final|**baseline**|[0.1117](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/deep-1B_power.png) |[0.1576](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/bigann-1B_power.png) 
|[0.1743](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/msturing-1B_power.png) |[0.1520](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/msspacev-1B_power.png) |[0.1128](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/text2image-1B_power.png)|[0.0904](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/ssnpp-1B_power.png)| -| 6|[-](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md)|-|- |-|**-**|- |- |- |- |-|-| - -* A submission must support at least 3 databases to qualify for this ranking. -* The ranking is based on the score, which is the sum of benchmark improvements of qualifying databases (shown in specific database columns after the score column.) -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. 
- -#### Cost Rankings - -|Rank|Submission |Team |Hardware|Status |Score |[Deep1B](#deep1B-cost-rankings)|[BigANN](#bigann-cost-rankings)|[MSTuring](#msturing-cost-rankings)|[MSSpace](#msspace-cost-rankings)|[Text2Image](#text2image-cost-rankings)|[FBSSNet](#fbsimsearchnet-cost-rankings)| -|----|------------------|-------|--------|-------|-----------|------|------|--------|-------|----------|--------------| -| 1|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md)|Intel|Intel Optane |final|**$-3,978,198.83**|$16,086.82 |$15,439.92 |$16,347.45 |$16,382.81 |$103,599.49 |- | -| 2|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md)|NVidia|NVidia GPU |final|**$-2,314,829.98\*\***|$303,929.39 |$304,166.48 |$153,151.00 |$153,155.12 |$916,823.34 |- | -| 3|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md)|NVidia|NVidia GPU |final|**$-2,268,943.17\*\***|$151,009.85 |$150,824.13 |$151,726.30 |$150,816.00 |- |- | -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md)|GSI Technology(*org*)|LedaE APU |final|**$-907,570.13**|$569,058.09 |$569,210.35 |$286,911.87 |$398,163.18 |$1,213,773.56 |$629,442.91 | -| 5|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md)|Facebook Research(*org*)|NVidia GPU |final|**baseline**|$545,633.16 |$737,886.17 |$853,857.46 |$735,942.66 |$1,272,735.86 |$428,074.79 | -| 6|[-](-)|-|- |-|**-**|- |- |- |- |- |- | - -* A submission must support at least 3 databases to qualify for this ranking. -* The ranking is based on the score, which is the sum of benchmark improvements of qualifying databases (shown in specific database columns after the score column.) 
-* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. - -* \*\*Nvidia has not yet approved the MSRP cost used for ranking, so participation in this benchmark is still pending. - -### Rankings Per Database - -#### Deep1B - -##### Deep1B Recall Rankings - -|Rank|Submission |Team |Hardware |Status |R@10 | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|-----------| -| 1|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |final|**[0.99882](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/deep-1B_recall.png)**| -| 2|[diskann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/diskann-bare-metal/README.md) |Microsoft Research India(*org*) |Dell PowerEdge |final|**[0.99821](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/deep-1B_recall.png)**| -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |final|**[0.99543](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/deep-1B_recall.png)**| -| 4|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |final|**[0.99504](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/deep-1B_recall.png)**| -| 5|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**[0.99208](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/deep-1B_recall.png)**| -| 
6|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**[0.94275](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/deep-1B_recall.png)**| - -* The operational point for ranking is 2000 QPS. We will use the highest recall for the search parameters that meet or exceed 2000 QPS. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. - -##### Deep1B Throughput Rankings - -|Rank|Submission |Team |Hardware |Status |Q/S | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|-----------| -| 1|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |final|**[801,694](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/deep-1B_throughput.png)**| -| 2|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |final|**[196,546](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/deep-1B_throughput.png)**| -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |final|**[91,701](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/deep-1B_throughput.png)**| -| 4|[diskann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/diskann-bare-metal/README.md) |Microsoft Research India(*org*) |Dell PowerEdge |final|**[12,927](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/deep-1B_throughput.png)**| -| 
5|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**[10,704](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/deep-1B_throughput.png)**| -| 6|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**[4,464](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/deep-1B_throughput.png)**| - -* The operational point for ranking is 0.90 recall@10. We will use the highest throughput for the search parameters that meet or exceed 0.90 recall@10. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. - -##### Deep1B Power Rankings - -|Rank|Submission |Team |Hardware |Status |W*S/Q | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|-----------| -| 1|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |final|**[0.0029](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/deep-1B_power.png)**| -| 2|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |final|**[0.0041](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/deep-1B_power.png)**| -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |final|**[0.0112](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/deep-1B_power.png)**| -| 
4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**[0.0337](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/deep-1B_power.png)**| -| 5|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**[0.1117](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/deep-1B_power.png)**| -| 6|[-](-) |- |- |-|**-**| - -* The operational point for ranking is 0.90 recall@10. We will use the lowest power consumption for the search parameters that meet or exceed 0.90 recall@10. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. - -##### Deep1B Cost Rankings - -|Rank|Submission |Team |Hardware |Status |Cost |capex |opex |unit cost|units@100K qps|KwH*4yrs | -|----|--------------------|---------|-----------------------|--------|-------------|--------|--------|---------|--------------|---------| -| 1|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md)|Intel |Intel Optane |final|**$16,086.82** |$14,664.20|$1,422.62|$14,664.20 |1 |14,226.208| -| 2|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md)|NVidia |NVidia GPU |final|**$151,009.85\*\*** |$150,000.00|$1,009.85|$150,000.00 |1 |10,098.482| -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md)|NVidia |NVidia GPU |final|**$303,929.39\*\*** |$300,000.00|$3,929.39|$150,000.00 |2 |39,293.902| -| 4|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md)|Facebook Research(*org*) |NVidia GPU |final|**$545,633.16** 
|$506,503.70|$39,129.46|$22,021.90 |23 |391,294.584| -| 5|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md)|GSI Technology(*org*) |LedaE APU |final|**$569,058.09** |$557,266.60|$11,791.49|$55,726.66 |10 |117,914.908| -| 6|[-](-)|- |- |-|**-** |-|-|- |- |-| - -* The operational point for ranking is 0.90 recall@10. We will use the lowest power consumption/query for the search parameters that meet or exceed 0.90 recall@10. -* The formula is based on: - * Take the algorithm's throughput submitted to leaderboard, use it to scale no. of systems needed to scale to 100K qps (using ceiling to round up any decimal.) - * Capex = cost per system * scale no. - * Take w*s/q from algorithm's power metric submitted to leaderboard and convert to KwH/q. - * Multiply by total queries at 100K qps for 4 years = 4x365x24x60x60x100000 total queries over 4 years. - * Opex = (total queries over 4 years) * KwH/query * $0.10/KwH -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. -* \*\*Nvidia has not yet approved the MSRP cost used for ranking, so participation in this benchmark is still pending. 
- -#### BigANN - -##### BigANN Recall Rankings - -|Rank|Submission |Team |Hardware |Status |R@10 | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|-------------| -| 1|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |final|**[0.99978](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/bigann-1B_recall.png)** | -| 2|[diskann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/diskann-bare-metal/README.md) |Microsoft Research India(*org*) |Dell PowerEdge |final|**[0.99976](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/bigann-1B_recall.png)** | -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |final|**[0.99881](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/bigann-1B_recall.png)** | -| 4|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |final|**[0.99815](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/bigann-1B_recall.png)** | -| 5|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**[0.99328](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/bigann-1B_recall.png)** | -| 6|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**[0.93260](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/bigann-1B_recall.png)** | - -* The operational point for ranking is 2000 QPS. 
We will use the highest recall for the search parameters that meet or exceed 2000 QPS. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. - -##### BigANN Throughput Rankings - -|Rank|Submission |Team |Hardware |Status |Q/S | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|-------------| -| 1|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |final|**[747,421](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/bigann-1B_throughput.png)** | -| 2|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |final|**[335,991](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/bigann-1B_throughput.png)** | -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |final|**[80,109](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/bigann-1B_throughput.png)** | -| 4|[diskann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/diskann-bare-metal/README.md) |Microsoft Research India(*org*) |Dell PowerEdge |final|**[19,094](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/bigann-1B_throughput.png)** | -| 5|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**[10,672](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/bigann-1B_throughput.png)** | -| 
6|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**[3,271](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/bigann-1B_throughput.png)** | - -* The operational point for ranking is 0.90 recall@10. We will use the highest throughput for the search parameters that meet or exceed 0.90 recall@10. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. - -##### BigANN Power Rankings - -|Rank|Submission |Team |Hardware |Status |W*S/Q | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|-----------| -| 1|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |final|**[0.0022](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/bigann-1B_power.png)**| -| 2|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |final|**[0.0024](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/bigann-1B_power.png)**| -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |final|**[0.0119](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/bigann-1B_power.png)**| -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**[0.0341](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/bigann-1B_power.png)**| -| 
5|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**[0.1576](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/bigann-1B_power.png)**| -| 6|[-](-) |- |- |-|**-**| - -* The operational point for ranking is 0.90 recall@10. We will use the lowest power consumption for the search parameters that meet or exceed 0.90 recall@10. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. - -##### BigANN Cost Rankings - -|Rank|Submission |Team |Hardware |Status |Cost |capex |opex |unit cost|units@100K qps|KwH*4yrs | -|----|--------------------|------------------------------|--------------------|--------|--------------|--------|--------|---------|--------------|---------| -| 1|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md)|Intel |Intel Optane |final|**$15,439.92** |$14,664.20|$775.72|$14,664.20 |1 |7,757.221| -| 2|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md)|NVidia |NVidia GPU |final|**$150,824.13\*\*** |$150,000.00|$824.13|$150,000.00 |1 |8,241.343| -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md)|NVidia |NVidia GPU |final|**$304,166.48\*\*** |$300,000.00|$4,166.48|$150,000.00 |2 |41,664.844| -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md)|GSI Technology(*org*) |LedaE APU |final|**$569,210.35** |$557,266.60|$11,943.75|$55,726.66 |10 |119,437.537| -| 5|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md)|Facebook Research(*org*) |NVidia GPU |final|**$737,886.17** |$682,678.90|$55,207.27|$22,021.90 |31 
|552,072.703| -| 6|[-](-)|- |- |-|**-** |-|-|- |- |-| - -* The operational point for ranking is 0.90 recall@10. We will use the lowest power consumption/query for the search parameters that meet or exceed 0.90 recall@10. -* The formula is based on: - * Take the algorithm's throughput submitted to leaderboard, use it to scale no. of systems needed to scale to 100K qps (using ceiling to round up any decimal.) - * Capex = cost per system * scale no. - * Take w*s/q from algorithm's power metric submitted to leaderboard and convert to KwH/q. - * Multiply by total queries at 100K qps for 4 years = 4x365x24x60x60x100000 total queries over 4 years. - * Opex = (total queries over 4 years) * KwH/query * $0.10/KwH -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. -* \*\*Nvidia has not yet approved the MSRP cost used for ranking, so participation in this benchmark is still pending. 
- -#### MSTuring - -##### MSTuring Recall Rankings - -|Rank|Submission |Team |Hardware |Status |R@10 | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|---------------| -| 1|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |final|**[0.99568](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/msturing-1B_recall.png)** | -| 2|[diskann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/diskann-bare-metal/README.md) |Microsoft Research India(*org*) |Dell PowerEdge |final|**[0.99444](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/msturing-1B_recall.png)** | -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |final|**[0.98993](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/msturing-1B_recall.png)** | -| 4|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |final|**[0.98399](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/msturing-1B_recall.png)** | -| 5|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**[0.97841](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/msturing-1B_recall.png)** | -| 6|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**[0.91322](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/msturing-1B_recall.png)** | - -* The operational point for ranking is 2000 QPS. 
We will use the highest recall for the search parameters that meet or exceed 2000 QPS. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. - -##### MSTuring Throughput Rankings - -|Rank|Submission |Team |Hardware |Status |Q/S | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|------------| -| 1|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |final|**[584,293](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/msturing-1B_throughput.png)** | -| 2|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |final|**[161,463](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/msturing-1B_throughput.png)** | -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |final|**[109,745](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/msturing-1B_throughput.png)** | -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**[21,780](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/msturing-1B_throughput.png)** | -| 5|[diskann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/diskann-bare-metal/README.md) |Microsoft Research India(*org*) |Dell PowerEdge |final|**[17,201](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/msturing-1B_throughput.png)** | -| 
6|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**[2,845](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/msturing-1B_throughput.png)** | - -* The operational point for ranking is 0.90 recall@10. We will use the highest throughput for the search parameters that meet or exceed 0.90 recall@10. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. - -##### MSTuring Power Rankings - -|Rank|Submission |Team |Hardware |Status|W*S/Q | -|----|-------------------------------------------------------|------------------------------|-----------------------|------|--------------| -| 1|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |final|**[0.0048](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/msturing-1B_power.png)** | -| 2|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |final|**[0.0049](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/msturing-1B_power.png)** | -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |final|**[0.0090](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/msturing-1B_power.png)** | -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**[0.0236](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/msturing-1B_power.png)** | -| 
5|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**[0.1743](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/msturing-1B_power.png)** | -| 6|[-](-) |- |- |-|**-** | - -* The operational point for ranking is 0.90 recall@10. We will use the lowest power consumption for the search parameters that meet or exceed 0.90 recall@10. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. - -##### MSTuring Cost Rankings - -|Rank|Submission |Team |Hardware |Status |Cost |capex |opex |unit cost|units@100K qps|KwH*4yrs | -|----|------------------------------------|------------------------------|-----------------------|--------|--------------|--------|--------|---------|--------------|----------| -| 1|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |final|**$16,347.45** |$14,664.20|$1,683.25|$14,664.20 |1 |16,832.451 | -| 2|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |final|**$151,726.30\*\*** |$150,000.00|$1,726.30|$150,000.00 |1 |17,262.993 | -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |final|**$153,151.00\*\*** |$150,000.00|$3,151.00|$150,000.00 |1 |31,509.973 | -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**$286,911.87** |$278,633.30|$8,278.57|$55,726.66 |5 |82,785.683 | -| 5|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**$853,857.46** 
|$792,788.40|$61,069.06|$22,021.90 |36 |610,690.611 | -| 6|[-](-) |- |- |-|**-** |-|-|- |- |- | - -* The operational point for ranking is 0.90 recall@10. We will use the lowest power consumption/query for the search parameters that meet or exceed 0.90 recall@10. -* The formula is based on: - * Take the algorithm's throughput submitted to leaderboard, use it to scale no. of systems needed to scale to 100K qps (using ceiling to round up any decimal.) - * Capex = cost per system * scale no. - * Take w*s/q from algorithm's power metric submitted to leaderboard and convert to KwH/q. - * Multiply by total queries at 100K qps for 4 years = 4x365x24x60x60x100000 total queries over 4 years. - * Opex = (total queries over 4 years) * KwH/query * $0.10/KwH -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. -* \*\*Nvidia has not yet approved the MSRP cost used for ranking, so participation in this benchmark is still pending. 
- -#### MSSpace - -##### MSSpace Recall Rankings - -|Rank|Submission |Team |Hardware |Status |R@10 | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|---------| -| 1|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |final|**[0.99835](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/msspacev-1B_recall.png)** | -| 2|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |final|**[0.99429](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/msspacev-1B_recall.png)** | -| 3|[diskann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/diskann-bare-metal/README.md) |Microsoft Research India(*org*) |Dell PowerEdge |final|**[0.99342](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/msspacev-1B_recall.png)** | -| 4|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |final|**[0.98785](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/msspacev-1B_recall.png)** | -| 5|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**[0.98622](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/msspacev-1B_recall.png)** | -| 6|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**[0.90853](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/msspacev-1B_recall.png)** | - -* The operational point for ranking is 2000 QPS. 
We will use the highest recall for the search parameters that meet or exceed 2000 QPS. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. - -##### MSSpace Throughput Rankings - -|Rank|Submission |Team |Hardware |Status |Q/S | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|------------| -| 1|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |final|**[839,749](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/msspacev-1B_throughput.png)** | -| 2|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |final|**[157,828](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/msspacev-1B_throughput.png)** | -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |final|**[108,302](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/msspacev-1B_throughput.png)** | -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**[16,422](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/msspacev-1B_throughput.png)** | -| 5|[diskann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/diskann-bare-metal/README.md) |Microsoft Research India(*org*) |Dell PowerEdge |final|**[6,503](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/msspacev-1B_throughput.png)** | -| 
6|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**[3,265](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/msspacev-1B_throughput.png)** | - -* The operational point for ranking is 0.9 recall@10. We will use the highest throughput for the search parameters that meet or exceed 0.9 recall@10. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. - -##### MSSpace Power Rankings - -|Rank|Submission |Team |Hardware |Status |W*S/Q | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|------------| -| 1|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |final|**[0.0023](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/msspacev-1B_power.png)** | -| 2|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |final|**[0.0049](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/msspacev-1B_power.png)** | -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |final|**[0.0090](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/msspacev-1B_power.png)** | -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**[0.0230](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/msspacev-1B_power.png)** | -| 
5|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**[0.1520](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/msspacev-1B_power.png)** | -| 6|[-](-) |- |- |-|**-** | - -* The operational point for ranking is 0.9 recall@10. We will use the lowest power consumption for the search parameters that meet or exceed 0.9 recall@10. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. - -##### MSSpace Cost Rankings - -|Rank|Submission |Team |Hardware |Status |Cost |capex |opex |unit cost|units@100K qps|KwH*4yrs | -|----|--------------------|------------------------------|-----------------------|------- |--------------|--------|--------|---------|--------------|----------| -| 1|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md)|Intel |Intel Optane |final|**$16,382.81** |$14,664.20|$1,718.61|$14,664.20 |1 |17,186.056 | -| 2|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md)|NVidia |NVidia GPU |final|**$150,816.00\*\*** |$150,000.00|$816.00|$150,000.00 |1 |8,160.006 | -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md)|NVidia |NVidia GPU |final|**$153,155.12\*\*** |$150,000.00|$3,155.12|$150,000.00 |1 |31,551.163 | -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md)|GSI Technology(*org*) |LedaE APU |final|**$398,163.18** |$390,086.62|$8,076.56|$55,726.66 |7 |80,765.638 | -| 5|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md)|Facebook Research(*org*) |NVidia GPU |final|**$735,942.66** 
|$682,678.90|$53,263.76|$22,021.90 |31 |532,637.584 | -| 6|[-](-)|- |- |-|**-** |-|-|- |- |- | - -* The operational point for ranking is 0.90 recall@10. We will use the lowest power consumption/query for the search parameters that meet or exceed 0.90 recall@10. -* The formula is based on: - * Take the algorithm's throughput submitted to leaderboard, use it to scale no. of systems needed to scale to 100K qps (using ceiling to round up any decimal.) - * Capex = cost per system * scale no. - * Take w*s/q from algorithm's power metric submitted to leaderboard and convert to KwH/q. - * Multiply by total queries at 100K qps for 4 years = 4x365x24x60x60x100000 total queries over 4 years. - * Opex = (total queries over 4 years) * KwH/query * $0.10/KwH -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. -* \*\*Nvidia has not yet approved the MSRP cost used for ranking, so participation in this benchmark is still pending. 
- -#### Text2Image - -##### Text2Image Recall Rankings - -|Rank|Submission |Team |Hardware |Status |R@10 | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|-------------| -| 1|[diskann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/diskann-bare-metal/README.md) |Microsoft Research India(*org*) |Dell PowerEdge |final|**[0.98130](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/text2image-1B_recall.png)** | -| 2|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |final|**[0.97340](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/text2image-1B_recall.png)** | -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |final|**[0.94692](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/text2image-1B_recall.png)** | -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**[0.92855](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/text2image-1B_recall.png)** | -| 5|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**[0.86028](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/text2image-1B_recall.png)** | -| 6|[-](-) |- |- |-|**-** | - -* The operational point for ranking is 2000 QPS. We will use the highest recall for the search parameters that meet or exceed 2000 QPS. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. 
- * *final* = final submission and ranking. - -##### Text2Image Throughput Rankings - -|Rank|Submission |Team |Hardware |Status |Q/S | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|------------| -| 1|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |final|**[19,094](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/text2image-1B_throughput.png)** | -| 2|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |final|**[17,063](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/text2image-1B_throughput.png)** | -| 3|[diskann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/diskann-bare-metal/README.md) |Microsoft Research India(*org*) |Dell PowerEdge |final|**[9,307](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/text2image-1B_throughput.png)** | -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**[4,838](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/text2image-1B_throughput.png)** | -| 5|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**[1,789](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/text2image-1B_throughput.png)** | -| 6|[-](-) |- |- |-|**-** | - -* The operational point for ranking is 0.860 recall@10. We will use the highest throughput for the search parameters that meet or exceed 0.860 recall@10. 
-* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. - -##### Text2Image Power Rankings - -|Rank|Submission |Team |Hardware |Status |W*S/Q | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|-----------| -| 1|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |final|**[0.0446](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/text2image-1B_power.png)**| -| 2|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |final|**[0.0480](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/text2image-1B_power.png)**| -| 3|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**[0.1128](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/text2image-1B_power.png)**| -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**[0.1242](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/text2image-1B_power.png)**| -| 5|[-](-) |- |- |-|**-**| -| 6|[-](-) |- |- |-|**-**| - -* The operational point for ranking is 0.86 recall@10. We will use the lowest power consumption for the search parameters that meet or exceed 0.86 recall@10. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. 
- -##### Text2Image Cost Rankings - -|Rank|Submission |Team |Hardware |Status |Cost |capex |opex |unit cost|units@100K qps|KwH*4yrs | -|----|---------------------|------------------------------|---------------------|--------|--------------|--------|--------|---------|--------------|---------| -| 1|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |final|**$103,599.49** |$87,985.20|$15,614.29|$14,664.20 |6 |156,142.873| -| 2|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |final|**$916,823.34\*\*** |$900,000.00|$16,823.34|$150,000.00 |6 |168,233.421| -| 3|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**$1,213,773.56** |$1,170,259.86|$43,513.70|$55,726.66 |21 |435,137.010| -| 4|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**$1,272,735.86** |$1,233,226.40|$39,509.46|$22,021.90 |56 |395,094.625| -| 5|[-](-) |- |- |-|**-** |-|-|- |- |-| -| 6|[-](-) |- |- |-|**-** |-|-|- |- |-| - -* The operational point for ranking is 0.86 recall@10. We will use the lowest power consumption/query for the search parameters that meet or exceed 0.86 recall@10. -* The formula is based on: - * Take the algorithm's throughput submitted to leaderboard, use it to scale no. of systems needed to scale to 100K qps (using ceiling to round up any decimal.) - * Capex = cost per system * scale no. - * Take w*s/q from algorithm's power metric submitted to leaderboard and convert to KwH/q. - * Multiply by total queries at 100K qps for 4 years = 4x365x24x60x60x100000 total queries over 4 years. 
- * Opex = (total queries over 4 years) * KwH/query * $0.10/KwH -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. -* \*\*Nvidia has not yet approved the MSRP cost used for ranking, so participation in this benchmark is still pending. - -#### FBSimSearchNet - -##### FBSimSearchNet AP Rankings - -|Rank|Submission |Team |Hardware |Status |AP | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|-------------| -| 1|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**[0.99684](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/ssnpp-1B_recall.png)** | -| 2|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**[0.97863](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/ssnpp-1B_recall.png)** | -| 3|[-](-) |- |- |-|**-** | -| 4|[-](-) |- |- |-|**-** | -| 5|[-](-) |- |- |-|**-** | -| 6|[-](-) |- |- |-|**-** | - -* The operational point for ranking is 2000 QPS. We will use the highest recall for the search parameters that meet or exceed 2000 QPS. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. 
- -##### FBSimSearchNet Throughput Rankings - -|Rank|Submission |Team |Hardware |Status |Q/S | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|------------| -| 1|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**[9,345](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/ssnpp-1B_throughput.png)** | -| 2|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**[5,699](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/ssnpp-1B_throughput.png)** | -| 3|[-](-) |- |- |-|**-** | -| 4|[-](-) |- |- |-|**-** | -| 5|[-](-) |- |- |-|**-** | -| 6|[-](-) |- |- |-|**-** | - -* The operational point for ranking is 0.9 average precision. We will use the highest throughput for the search parameters that meet or exceed 0.9 average precision. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. 
- - -##### FBSimSearchNet Power Rankings - -|Rank|Submission |Team |Hardware |Status |W*S/Q | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|-----------| -| 1|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**[0.0469](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/ssnpp-1B_power.png)**| -| 2|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**[0.0904](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/ssnpp-1B_power.png)**| -| 3|[-](-) |- |- |-|**-**| -| 4|[-](-) |- |- |-|**-**| -| 5|[-](-) |- |- |-|**-**| -| 6|[-](-) |- |- |-|**-**| - -* The operational point for ranking is 0.9 average precision. We will use the lowest power consumption for the search parameters that meet or exceed 0.9 average precision. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. 
- -##### FBSimSearchNet Cost Rankings - -|Rank|Submission |Team |Hardware |Status |Cost |capex |opex |unit cost|units@100K qps|KwH*4yrs | -|----|--------------------|------------------------------|---------------------|--------|--------------|--------|--------|---------|--------------|---------| -| 1|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md)|Facebook Research(*org*) |NVidia GPU |final|**$428,074.79** |$396,394.20|$31,680.59|$22,021.90 |18 |316,805.859| -| 2|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md)|GSI Technology(*org*) |LedaE APU |final|**$629,442.91** |$612,993.26|$16,449.65|$55,726.66 |11 |164,496.451| -| 3|[-](-)|- |- |-|**-** | -| -| -| -| -| -| 4|[-](-)|- |- |-|**-** | -| -| -| -| -| - -* The operational point for ranking is 0.9 recall@10. We will use the lowest power consumption/query for the search parameters that meet or exceed 0.9 recall@10. -* The formula is based on: - * Take the algorithm's throughput submitted to leaderboard, use it to scale no. of systems needed to scale to 100K qps (using ceiling to round up any decimal.) - * Capex = cost per system * scale no. - * Take w*s/q from algorithm's power metric submitted to leaderboard and convert to KwH/q. - * Multiply by total queries at 100K qps for 4 years = 4x365x24x60x60x100000 total queries over 4 years. - * Opex = (total queries over 4 years) * KwH/query * $0.10/KwH -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. -* \*\*Nvidia has not yet approved the MSRP cost used for ranking, so participation in this benchmark is still pending. 
diff --git a/t3/LEADERBOARDS_PUBLIC_REJECT_ANOMALIES.md b/t3/LEADERBOARDS_PUBLIC_REJECT_ANOMALIES.md deleted file mode 100644 index c36c071fe..000000000 --- a/t3/LEADERBOARDS_PUBLIC_REJECT_ANOMALIES.md +++ /dev/null @@ -1,566 +0,0 @@ -# T3 Track Public Dataset Leaderboards After Rejecting Anomalies - -Please note that all rankings and winners are unofficial until all [open tasks and issues](TASKS_ISSUES_RESOLUTIONS.md) are resolved. - -## Rankings By Category - -### Rankings By Submission Name (alphabetical) - -|Submission |Team |Hardware |[Recall Rank](#recall-or-ap-rankings)|[Thru-put Rank](#throughput-rankings)|[Power Rank](#power-rankings)|[Cost Rank](#cost-rankings)|Status |Anomalies|Evaluator|Algo |Runs | -|--------------------|-----------|----------|---------|---------|---------|--------|---------|---------|---------|---------|--------| -|[diskann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/diskann-bare-metal/README.md) |Microsoft Research India(*org*) |Dell PowerEdge |[1](#recall-or-ap-rankings) |[5](#throughput-rankings) |*NQ* |*NQ* |final |*NA* |[Harsha Simhadri](https://github.com/harsha-simhadri) |- |- | -|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |[6](#recall-or-ap-rankings) |[6](#throughput-rankings) |[5](#power-rankings) |[5](#cost-rankings) |final |0/58 |[George Williams](https://github.com/sourcesync) |- |- | -|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |[4](#recall-or-ap-rankings) |[4](#throughput-rankings) |[4](#power-rankings) |[4](#cost-rankings) |final |0/60 |[George Williams](https://github.com/sourcesync) |- |- | -|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |[3](#recall-or-ap-rankings) |[3](#throughput-rankings) |[2](#power-rankings) 
|[2](#cost-rankings)\*\* |final |[6/50](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/ANOMALIES.md) |[George Williams](https://github.com/sourcesync) |- |- | -|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |[5](#recall-or-ap-rankings) |[1](#throughput-rankings) |[3](#power-rankings) |[3](#cost-rankings)\*\* |final |[4/40](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/ANOMALIES.md) |[George Williams](https://github.com/sourcesync) |- |- | -|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md)|Intel |Intel Optane |[2](#recall-or-ap-rankings) |[2](#throughput-rankings) |[1](#power-rankings) |[1](#cost-rankings)|final |[5/50](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/ANOMALIES.md) |[George Williams](https://github.com/sourcesync) |- |-| - -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. - * *NQ* = not qualified - * *NA* = data is not yet available, or has not yet been processed - -* *Anomalies* are defined as queries that could potentially be the result of query response caching, a violation of the competition. Our detection method looks for a 30% or more improvement in the batch query latency between the first and last query of a query group (5). Participants have been given a chance to explain why detected anomalies (if any) are not a result of query response caching. In general, our analysis did not uncover this symptom of systematic query response caching from any submission. Also, if we throw out the anomalous data points, the adjusted leaderboard rankings (above) do not change even though some scores change slightly. 
- -* \*\*Nvidia has not yet approved the MSRP cost used for ranking, so participation in this benchmark is still pending. - -### Rankings Per Benchmark - -#### Recall Or AP Rankings - -|Rank|Submission |Team |Hardware|Status |Score |[Deep1B](#deep1B-recall-rankings)|[BigANN](#bigann-recall-rankings)|[MSTuring](#msturing-recall-rankings)|[MSSpace](#msspace-recall-rankings)|[Text2Image](#text2image-recall-rankings)|[FBSSNet](#fbsimsearchnet-ap-rankings)| -|----|------------------|-------|--------|-------|-----------|------|------|--------|-------|----------|-------| -| 1|[diskann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/diskann-bare-metal/README.md)|Microsoft Research India(*org*)|Dell PowerEdge |final|**0.410**|0.99821 |0.99976 |0.99444 |0.99342 |0.98130 |- | -| 2|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md)|Intel|Intel Optane |final|**0.409**|0.99882 |0.99978 |0.99568 |0.99835 |0.97340 |- | -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md)|NVidia|NVidia GPU |final|**0.368**|0.99543 |0.99881 |0.98993 |0.99429 |0.94692 |- | -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md)|GSI Technology(*org*)|LedaE APU |final|**0.339**|0.99208 |0.99328 |0.97841 |0.98622 |0.92855 |0.99684 | -| 5|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md)|NVidia|NVidia GPU |final|**0.166**|0.95736 |0.96750 |0.96286 |0.97541 |- |- | -| 6|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md)|Facebook Research(*org*)|NVidia GPU |final|**baseline**|0.94275 |0.93260 |0.91322 |0.90853 |0.86028 |0.97863 | - -* A submission must support at least 3 databases to qualify for this ranking. 
-* The ranking is based on the score, which is the sum of benchmark improvements of qualifying databases (shown in specific database columns after the score column.) -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. - -#### Throughput Rankings - -|Rank|Submission |Team |Hardware|Status |Score |[Deep1B](#deep1B-throughput-rankings)|[BigANN](#bigann-throughput-rankings)|[MSTuring](#msturing-throughput-rankings)|[MSSpace](#msspace-throughput-rankings)|[Text2Image](#text2image-throughput-rankings)|[FBSSNet](#fbsimsearchnet-throughput-rankings)| -|----|------------------|-------|--------|-------|-----------|------|------|--------|-------|----------|--------------| -| 1|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md)|NVidia|NVidia GPU |final|**2959313**|801,694 |747,421 |584,293 |839,749 |- |- | -| 2|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md)|Intel|Intel Optane |final|**851327**|196,546 |335,991 |161,463 |155,899 |17,063 |- | -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md)|NVidia|NVidia GPU |final|**393318**|91,701 |80,109 |109,745 |108,302 |19,094 |- | -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md)|GSI Technology(*org*)|LedaE APU |final|**52429**|10,704 |10,672 |21,780 |16,422 |4,838 |9,345 | -| 5|[diskann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/diskann-bare-metal/README.md)|Microsoft Research India(*org*)|Dell PowerEdge |final|**49398**|12,927 |19,094 |17,201 |6,503 |9,307 |- | -| 6|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md)|Facebook Research(*org*)|NVidia GPU 
|final|**baseline**|4,464 |3,271 |2,845 |3,265 |1,789 |5,699 | - -* A submission must support at least 3 databases to qualify for this ranking. -* The ranking is based on the score, which is the sum of benchmark improvements of qualifying databases (shown in specific database columns after the score column.) -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. - -#### Power Rankings - -|Rank|Submission |Team |Hardware|Status |Score |[Deep1B](#deep1B-power-rankings)|[BigANN](#bigann-power-rankings)|[MSTuring](#msturing-power-rankings)|[MSSpace](#msspace-power-rankings)|[Text2Image](#text2image-power-rankings)|[FBSSNet](#fbsimsearchnet-power-rankings)| -|----|------------------|-------|--------|-------|-----------|------|------|--------|-------|-----|-----| -| 1|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md)|Intel|Intel Optane |final|**-0.648**|0.0041 |0.0022 |0.0048 |0.0050 |0.0446|-| -| 2|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md)|NVidia|NVidia GPU |final|**-0.619**|0.0112 |0.0119 |0.0090 |0.0090 |0.0480|-| -| 3|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md)|NVidia|NVidia GPU |final|**-0.583**|0.0029 |0.0024 |0.0049 |0.0023 |-|-| -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md)|GSI Technology(*org*)|LedaE APU |final|**-0.513**|0.0337 |0.0341 |0.0236 |0.0230 |0.1242|0.0469| -| 5|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md)|Facebook Research(*org*)|NVidia GPU |final|**baseline**|0.1117 |0.1576 |0.1743 |0.1520 |0.1128|0.0904| -| 
6|[-](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md)|-|- |-|**-**|- |- |- |- |-|-| - -* A submission must support at least 3 databases to qualify for this ranking. -* The ranking is based on the score, which is the sum of benchmark improvements of qualifying databases (shown in specific database columns after the score column.) -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. - -#### Cost Rankings - -|Rank|Submission |Team |Hardware|Status |Score |[Deep1B](#deep1B-cost-rankings)|[BigANN](#bigann-cost-rankings)|[MSTuring](#msturing-cost-rankings)|[MSSpace](#msspace-cost-rankings)|[Text2Image](#text2image-cost-rankings)|[FBSSNet](#fbsimsearchnet-cost-rankings)| -|----|------------------|-------|--------|-------|-----------|------|------|--------|-------|----------|--------------| -| 1|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md)|Intel|Intel Optane |final|**$-3,978,172.56**|$16,086.82 |$15,439.92 |$16,347.45 |$16,409.08 |$103,599.49 |- | -| 2|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md)|NVidia|NVidia GPU |final|**$-2,314,829.98\*\***|$303,929.39 |$304,166.48 |$153,151.00 |$153,155.12 |$916,823.34 |- | -| 3|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md)|NVidia|NVidia GPU |final|**$-2,268,943.17\*\***|$151,009.85 |$150,824.13 |$151,726.30 |$150,816.00 |- |- | -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md)|GSI Technology(*org*)|LedaE APU |final|**$-907,570.13**|$569,058.09 |$569,210.35 |$286,911.87 |$398,163.18 |$1,213,773.56 |$629,442.91 | -| 
5|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md)|Facebook Research(*org*)|NVidia GPU |final|**baseline**|$545,633.16 |$737,886.17 |$853,857.46 |$735,942.66 |$1,272,735.86 |$428,074.79 | -| 6|[-](-)|-|- |-|**-**|- |- |- |- |- |- | - -* A submission must support at least 3 databases to qualify for this ranking. -* The ranking is based on the score, which is the sum of benchmark improvements of qualifying databases (shown in specific database columns after the score column.) -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. - -* \*\*Nvidia has not yet approved the MSRP cost used for ranking, so participation in this benchmark is still pending. - -### Rankings Per Database - -#### Deep1B - -##### Deep1B Recall Rankings - -|Rank|Submission |Team |Hardware |Status |R@10 | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|-----------| -| 1|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |final|**0.99882**| -| 2|[diskann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/diskann-bare-metal/README.md) |Microsoft Research India(*org*) |Dell PowerEdge |final|**0.99821**| -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |final|**0.99543**| -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**0.99208**| -| 5|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |final|**0.95736**| -| 
6|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**0.94275**| - -* The operational point for ranking is 2000 QPS. We will use the highest recall for the search parameters that meet or exceed 2000 QPS. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. - -##### Deep1B Throughput Rankings - -|Rank|Submission |Team |Hardware |Status |Q/S | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|-----------| -| 1|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |final|**801,694**| -| 2|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |final|**196,546**| -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |final|**91,701**| -| 4|[diskann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/diskann-bare-metal/README.md) |Microsoft Research India(*org*) |Dell PowerEdge |final|**12,927**| -| 5|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**10,704**| -| 6|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**4,464**| - -* The operational point for ranking is 0.90 recall@10. We will use the highest throughput for the search parameters that meet or exceed 0.90 recall@10. 
-* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. - -##### Deep1B Power Rankings - -|Rank|Submission |Team |Hardware |Status |W*S/Q | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|-----------| -| 1|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |final|**0.0029**| -| 2|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |final|**0.0041**| -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |final|**0.0112**| -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**0.0337**| -| 5|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**0.1117**| -| 6|[-](-) |- |- |-|**-**| - -* The operational point for ranking is 0.90 recall@10. We will use the lowest power consumption for the search parameters that meet or exceed 0.90 recall@10. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. 
- -##### Deep1B Cost Rankings - -|Rank|Submission |Team |Hardware |Status |Cost |capex |opex |unit cost|units@100K qps|KwH*4yrs | -|----|--------------------|---------|-----------------------|--------|-------------|--------|--------|---------|--------------|---------| -| 1|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md)|Intel |Intel Optane |final|**$16,086.82** |$14,664.20|$1,422.62|$14,664.20 |1 |14,226.208| -| 2|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md)|NVidia |NVidia GPU |final|**$151,009.85\*\*** |$150,000.00|$1,009.85|$150,000.00 |1 |10,098.482| -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md)|NVidia |NVidia GPU |final|**$303,929.39\*\*** |$300,000.00|$3,929.39|$150,000.00 |2 |39,293.902| -| 4|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md)|Facebook Research(*org*) |NVidia GPU |final|**$545,633.16** |$506,503.70|$39,129.46|$22,021.90 |23 |391,294.584| -| 5|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md)|GSI Technology(*org*) |LedaE APU |final|**$569,058.09** |$557,266.60|$11,791.49|$55,726.66 |10 |117,914.908| -| 6|[-](-)|- |- |-|**-** |-|-|- |- |-| - -* The operational point for ranking is 0.90 recall@10. We will use the lowest power consumption/query for the search parameters that meet or exceed 0.90 recall@10. -* The formula is based on: - * Take the algorithm's throughput submitted to leaderboard, use it to scale no. of systems needed to scale to 100K qps (using ceiling to round up any decimal.) - * Capex = cost per system * scale no. - * Take w*s/q from algorithm's power metric submitted to leaderboard and convert to KwH/q. 
- * Multiply by total queries at 100K qps for 4 years = 4x365x24x60x60x100000 total queries - * Opex = (total queries over 4 years) * KwH/query * $0.10/KwH -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. -* \*\*Nvidia has not yet approved the MSRP cost used for ranking, so participation in this benchmark is still pending. - -#### BigANN - -##### BigANN Recall Rankings - -|Rank|Submission |Team |Hardware |Status |R@10 | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|-------------| -| 1|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |final|**0.99978** | -| 2|[diskann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/diskann-bare-metal/README.md) |Microsoft Research India(*org*) |Dell PowerEdge |final|**0.99976** | -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |final|**0.99881** | -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**0.99328** | -| 5|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |final|**0.96750** | -| 6|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**0.93260** | - -* The operational point for ranking is 2000 QPS. We will use the highest recall for the search parameters that meet or exceed 2000 QPS. 
-* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. - -##### BigANN Throughput Rankings - -|Rank|Submission |Team |Hardware |Status |Q/S | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|-------------| -| 1|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |final|**747,421** | -| 2|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |final|**335,991** | -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |final|**80,109** | -| 4|[diskann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/diskann-bare-metal/README.md) |Microsoft Research India(*org*) |Dell PowerEdge |final|**19,094** | -| 5|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**10,672** | -| 6|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**3,271** | - -* The operational point for ranking is 0.90 recall@10. We will use the highest throughput for the search parameters that meet or exceed 0.90 recall@10. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. 
- -##### BigANN Power Rankings - -|Rank|Submission |Team |Hardware |Status |W*S/Q | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|-----------| -| 1|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |final|**0.0022**| -| 2|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |final|**0.0024**| -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |final|**0.0119**| -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**0.0341**| -| 5|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**0.1576**| -| 6|[-](-) |- |- |-|**-**| - -* The operational point for ranking is 0.90 recall@10. We will use the lowest power consumption for the search parameters that meet or exceed 0.90 recall@10. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. 
- -##### BigANN Cost Rankings - -|Rank|Submission |Team |Hardware |Status |Cost |capex |opex |unit cost|units@100K qps|KwH*4yrs | -|----|--------------------|------------------------------|--------------------|--------|--------------|--------|--------|---------|--------------|---------| -| 1|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md)|Intel |Intel Optane |final|**$15,439.92** |$14,664.20|$775.72|$14,664.20 |1 |7,757.221| -| 2|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md)|NVidia |NVidia GPU |final|**$150,824.13\*\*** |$150,000.00|$824.13|$150,000.00 |1 |8,241.343| -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md)|NVidia |NVidia GPU |final|**$304,166.48\*\*** |$300,000.00|$4,166.48|$150,000.00 |2 |41,664.844| -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md)|GSI Technology(*org*) |LedaE APU |final|**$569,210.35** |$557,266.60|$11,943.75|$55,726.66 |10 |119,437.537| -| 5|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md)|Facebook Research(*org*) |NVidia GPU |final|**$737,886.17** |$682,678.90|$55,207.27|$22,021.90 |31 |552,072.703| -| 6|[-](-)|- |- |-|**-** |-|-|- |- |-| - -* The operational point for ranking is 0.90 recall@10. We will use the lowest power consumption/query for the search parameters that meet or exceed 0.90 recall@10. -* The formula is based on: - * Take the algorithm's throughput submitted to leaderboard, use it to scale no. of systems needed to scale to 100K qps (using ceiling to round up any decimal.) - * Capex = cost per system * scale no. - * Take w*s/q from algorithm's power metric submitted to leaderboard and convert to KwH/q. - * Multiply by total queries at 100K qps for 4 years = 4x365x24x60x60x100000 total queries over 4 years. 
- * Opex = (total queries over 4 years) * KwH/query * $0.10/KwH -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. -* \*\*Nvidia has not yet approved the MSRP cost used for ranking, so participation in this benchmark is still pending. - -#### MSTuring - -##### MSTuring Recall Rankings - -|Rank|Submission |Team |Hardware |Status |R@10 | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|---------------| -| 1|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |final|**0.99568** | -| 2|[diskann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/diskann-bare-metal/README.md) |Microsoft Research India(*org*) |Dell PowerEdge |final|**0.99444** | -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |final|**0.98993** | -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**0.97841** | -| 5|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |final|**0.96286** | -| 6|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**0.91322** | - -* The operational point for ranking is 2000 QPS. We will use the highest recall for the search parameters that meet or exceed 2000 QPS. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. 
- -##### MSTuring Throughput Rankings - -|Rank|Submission |Team |Hardware |Status |Q/S | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|------------| -| 1|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |final|**584,293** | -| 2|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |final|**161,463** | -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |final|**109,745** | -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**21,780** | -| 5|[diskann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/diskann-bare-metal/README.md) |Microsoft Research India(*org*) |Dell PowerEdge |final|**17,201** | -| 6|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**2,845** | - -* The operational point for ranking is 0.90 recall@10. We will use the highest throughput for the search parameters that meet or exceed 0.90 recall@10. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. 
- -##### MSTuring Power Rankings - -|Rank|Submission |Team |Hardware |Status|W*S/Q | -|----|-------------------------------------------------------|------------------------------|-----------------------|------|--------------| -| 1|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |final|**0.0048** | -| 2|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |final|**0.0049** | -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |final|**0.0090** | -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**0.0236** | -| 5|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**0.1743** | -| 6|[-](-) |- |- |-|**-** | - -* The operational point for ranking is 0.90 recall@10. We will use the lowest power consumption for the search parameters that meet or exceed 0.90 recall@10. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. 
- -##### MSTuring Cost Rankings - -|Rank|Submission |Team |Hardware |Status |Cost |capex |opex |unit cost|units@100K qps|KwH*4yrs | -|----|------------------------------------|------------------------------|-----------------------|--------|--------------|--------|--------|---------|--------------|----------| -| 1|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |final|**$16,347.45** |$14,664.20|$1,683.25|$14,664.20 |1 |16,832.451 | -| 2|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |final|**$151,726.30\*\*** |$150,000.00|$1,726.30|$150,000.00 |1 |17,262.993 | -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |final|**$153,151.00\*\*** |$150,000.00|$3,151.00|$150,000.00 |1 |31,509.973 | -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**$286,911.87** |$278,633.30|$8,278.57|$55,726.66 |5 |82,785.683 | -| 5|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**$853,857.46** |$792,788.40|$61,069.06|$22,021.90 |36 |610,690.611 | -| 6|[-](-) |- |- |-|**-** |-|-|- |- |- | - -* The operational point for ranking is 0.90 recall@10. We will use the lowest power consumption/query for the search parameters that meet or exceed 0.90 recall@10. -* The formula is based on: - * Take the algorithm's throughput submitted to leaderboard, use it to scale no. of systems needed to scale to 100K qps (using ceiling to round up any decimal.) - * Capex = cost per system * scale no. - * Take w*s/q from algorithm's power metric submitted to leaderboard and convert to KwH/q. 
- * Multiply by total queries at 100K qps for 4 years = 4x365x24x60x60x100000 total queries over 4 years. - * Opex = (total queries over 4 years) * KwH/query * $0.10/KwH -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. -* \*\*Nvidia has not yet approved the MSRP cost used for ranking, so participation in this benchmark is still pending. - -#### MSSpace - -##### MSSpace Recall Rankings - -|Rank|Submission |Team |Hardware |Status |R@10 | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|---------| -| 1|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |final|**0.99835** | -| 2|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |final|**0.99429** | -| 3|[diskann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/diskann-bare-metal/README.md) |Microsoft Research India(*org*) |Dell PowerEdge |final|**0.99342** | -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**0.98622** | -| 5|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |final|**0.97541** | -| 6|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**0.90853** | - -* The operational point for ranking is 2000 QPS. We will use the highest recall for the search parameters that meet or exceed 2000 QPS. 
-* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. - -##### MSSpace Throughput Rankings - -|Rank|Submission |Team |Hardware |Status |Q/S | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|------------| -| 1|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |final|**839,749** | -| 2|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |final|**155,899** | -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |final|**108,302** | -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**16,422** | -| 5|[diskann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/diskann-bare-metal/README.md) |Microsoft Research India(*org*) |Dell PowerEdge |final|**6,503** | -| 6|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**3,265** | - -* The operational point for ranking is 0.9 recall@10. We will use the highest throughput for the search parameters that meet or exceed 0.9 recall@10. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. 
- -##### MSSpace Power Rankings - -|Rank|Submission |Team |Hardware |Status |W*S/Q | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|------------| -| 1|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |final|**0.0023** | -| 2|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |final|**0.0050** | -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |final|**0.0090** | -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**0.0230** | -| 5|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**0.1520** | -| 6|[-](-) |- |- |-|**-** | - -* The operational point for ranking is 0.9 recall@10. We will use the lowest power consumption for the search parameters that meet or exceed 0.9 recall@10. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. 
- -##### MSSpace Cost Rankings - -|Rank|Submission |Team |Hardware |Status |Cost |capex |opex |unit cost|units@100K qps|KwH*4yrs | -|----|--------------------|------------------------------|-----------------------|------- |--------------|--------|--------|---------|--------------|----------| -| 1|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md)|Intel |Intel Optane |final|**$16,409.08** |$14,664.20|$1,744.88|$14,664.20 |1 |17,448.764 | -| 2|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md)|NVidia |NVidia GPU |final|**$150,816.00\*\*** |$150,000.00|$816.00|$150,000.00 |1 |8,160.006 | -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md)|NVidia |NVidia GPU |final|**$153,155.12\*\*** |$150,000.00|$3,155.12|$150,000.00 |1 |31,551.163 | -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md)|GSI Technology(*org*) |LedaE APU |final|**$398,163.18** |$390,086.62|$8,076.56|$55,726.66 |7 |80,765.638 | -| 5|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md)|Facebook Research(*org*) |NVidia GPU |final|**$735,942.66** |$682,678.90|$53,263.76|$22,021.90 |31 |532,637.584 | -| 6|[-](-)|- |- |-|**-** |-|-|- |- |- | - -* The operational point for ranking is 0.90 recall@10. We will use the lowest power consumption/query for the search parameters that meet or exceed 0.90 recall@10. -* The formula is based on: - * Take the algorithm's throughput submitted to leaderboard, use it to scale no. of systems needed to scale to 100K qps (using ceiling to round up any decimal.) - * Capex = cost per system * scale no. - * Take w*s/q from algorithm's power metric submitted to leaderboard and convert to KwH/q. - * Multiply by total queries at 100K qps for 4 years = 4x365x24x60x60x100000 total queries over 4 years. 
- * Opex = (total queries over 4 years) * KwH/query * $0.10/KwH -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. -* \*\*Nvidia has not yet approved the MSRP cost used for ranking, so participation in this benchmark is still pending. - -#### Text2Image - -##### Text2Image Recall Rankings - -|Rank|Submission |Team |Hardware |Status |R@10 | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|-------------| -| 1|[diskann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/diskann-bare-metal/README.md) |Microsoft Research India(*org*) |Dell PowerEdge |final|**0.98130** | -| 2|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |final|**0.97340** | -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |final|**0.94692** | -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**0.92855** | -| 5|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**0.86028** | -| 6|[-](-) |- |- |-|**-** | - -* The operational point for ranking is 2000 QPS. We will use the highest recall for the search parameters that meet or exceed 2000 QPS. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. 
- -##### Text2Image Throughput Rankings - -|Rank|Submission |Team |Hardware |Status |Q/S | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|------------| -| 1|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |final|**19,094** | -| 2|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |final|**17,063** | -| 3|[diskann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/diskann-bare-metal/README.md) |Microsoft Research India(*org*) |Dell PowerEdge |final|**9,307** | -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**4,838** | -| 5|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**1,789** | -| 6|[-](-) |- |- |-|**-** | - -* The operational point for ranking is 0.860 recall@10. We will use the highest throughput for the search parameters that meet or exceed 0.860 recall@10. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. 
- -##### Text2Image Power Rankings - -|Rank|Submission |Team |Hardware |Status |W*S/Q | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|-----------| -| 1|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |final|**0.0446**| -| 2|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |final|**0.0480**| -| 3|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**0.1128**| -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**0.1242**| -| 5|[-](-) |- |- |-|**-**| -| 6|[-](-) |- |- |-|**-**| - -* The operational point for ranking is 0.86 recall@10. We will use the lowest power consumption for the search parameters that meet or exceed 0.86 recall@10. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. 
- -##### Text2Image Cost Rankings - -|Rank|Submission |Team |Hardware |Status |Cost |capex |opex |unit cost|units@100K qps|KwH*4yrs | -|----|---------------------|------------------------------|---------------------|--------|--------------|--------|--------|---------|--------------|---------| -| 1|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |final|**$103,599.49** |$87,985.20|$15,614.29|$14,664.20 |6 |156,142.873| -| 2|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |final|**$916,823.34\*\*** |$900,000.00|$16,823.34|$150,000.00 |6 |168,233.421| -| 3|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**$1,213,773.56** |$1,170,259.86|$43,513.70|$55,726.66 |21 |435,137.010| -| 4|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**$1,272,735.86** |$1,233,226.40|$39,509.46|$22,021.90 |56 |395,094.625| -| 5|[-](-) |- |- |-|**-** |-|-|- |- |-| -| 6|[-](-) |- |- |-|**-** |-|-|- |- |-| - -* The operational point for ranking is 0.86 recall@10. We will use the lowest power consumption/query for the search parameters that meet or exceed 0.86 recall@10. -* The formula is based on: - * Take the algorithm's throughput submitted to leaderboard, use it to scale no. of systems needed to scale to 100K qps (using ceiling to round up any decimal.) - * Capex = cost per system * scale no. - * Take w*s/q from algorithm's power metric submitted to leaderboard and convert to KwH/q. - * Multiply by total queries at 100K qps for 4 years = 4x365x24x60x60x100000 total queries over 4 years. 
- * Opex = (total queries over 4 years) * KwH/query * $0.10/KwH -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. -* \*\*Nvidia has not yet approved the MSRP cost used for ranking, so participation in this benchmark is still pending. - -#### FBSimSearchNet - -##### FBSimSearchNet AP Rankings - -|Rank|Submission |Team |Hardware |Status |AP | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|-------------| -| 1|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**0.99684** | -| 2|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**0.97863** | -| 3|[-](-) |- |- |-|**-** | -| 4|[-](-) |- |- |-|**-** | -| 5|[-](-) |- |- |-|**-** | -| 6|[-](-) |- |- |-|**-** | - -* The operational point for ranking is 2000 QPS. We will use the highest average precision (AP) for the search parameters that meet or exceed 2000 QPS. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking.
- -##### FBSimSearchNet Throughput Rankings - -|Rank|Submission |Team |Hardware |Status |Q/S | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|------------| -| 1|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**9,345** | -| 2|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**5,699** | -| 3|[-](-) |- |- |-|**-** | -| 4|[-](-) |- |- |-|**-** | -| 5|[-](-) |- |- |-|**-** | -| 6|[-](-) |- |- |-|**-** | - -* The operational point for ranking is 0.9 average precision. We will use the highest throughput for the search parameters that meet or exceed 0.9 average precision. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. - - -##### FBSimSearchNet Power Rankings - -|Rank|Submission |Team |Hardware |Status |W*S/Q | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|-----------| -| 1|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**0.0469**| -| 2|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**0.0904**| -| 3|[-](-) |- |- |-|**-**| -| 4|[-](-) |- |- |-|**-**| -| 5|[-](-) |- |- |-|**-**| -| 6|[-](-) |- |- |-|**-**| - -* The operational point for ranking is 0.9 average precision. We will use the lowest power consumption for the search parameters that meet or exceed 0.9 average precision.
-* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. - -##### FBSimSearchNet Cost Rankings - -|Rank|Submission |Team |Hardware |Status |Cost |capex |opex |unit cost|units@100K qps|KwH*4yrs | -|----|--------------------|------------------------------|---------------------|--------|--------------|--------|--------|---------|--------------|---------| -| 1|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md)|Facebook Research(*org*) |NVidia GPU |final|**$428,074.79** |$396,394.20|$31,680.59|$22,021.90 |18 |316,805.859| -| 2|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md)|GSI Technology(*org*) |LedaE APU |final|**$629,442.91** |$612,993.26|$16,449.65|$55,726.66 |11 |164,496.451| -| 3|[-](-)|- |- |-|**-** | -| -| -| -| -| -| 4|[-](-)|- |- |-|**-** | -| -| -| -| -| - -* The operational point for ranking is 0.9 recall@10. We will use the lowest power consumption/query for the search parameters that meet or exceed 0.9 recall@10. -* The formula is based on: - * Take the algorithm's throughput submitted to leaderboard, use it to scale no. of systems needed to scale to 100K qps (using ceiling to round up any decimal.) - * Capex = cost per system * scale no. - * Take w*s/q from algorithm's power metric submitted to leaderboard and convert to KwH/q. - * Multiply by total queries at 100K qps for 4 years = 4x365x24x60x60x100000 total queries over 4 years. - * Opex = (total queries over 4 years) * KwH/query * $0.10/KwH -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *eval* = final submissions are being evaluated. - * *final* = final submission and ranking. 
-* \*\*Nvidia has not yet approved the MSRP cost used for ranking, so participation in this benchmark is still pending. diff --git a/t3/LEADERBOARDS_REJECT_ANOMALIES.md b/t3/LEADERBOARDS_REJECT_ANOMALIES.md deleted file mode 100644 index ab8ce9cef..000000000 --- a/t3/LEADERBOARDS_REJECT_ANOMALIES.md +++ /dev/null @@ -1,571 +0,0 @@ -# T3 Track Leaderboards After Rejecting Anomalies (Unofficial) - -Please note that all rankings are currently unofficial due to the following reasons: -* All [open tasks and issues](TASKS_ISSUES_RESOLUTIONS.md) must be resolved. - -## Final Rankings On Private Query Set - -*Not yet available* - -## Rankings On Public Query Set - -### Rankings By Submission Name (alphabetical) - -|Submission |Team |Hardware |[Recall Rank](#recall-or-ap-rankings)|[Thru-put Rank](#throughput-rankings)|[Power Rank](#power-rankings)|[Cost Rank](#cost-rankings)|Status |Anomalies|Evaluator|Algo |Runs | -|--------------------|-----------|----------|---------|---------|---------|--------|---------|---------|---------|---------|--------| -|[diskann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/diskann-bare-metal/README.md) |Microsoft Research India(*org*) |Dell PowerEdge |[1](#recall-or-ap-rankings) |[5](#throughput-rankings) |*NQ* |*NQ* |final |*NA* |Harsha Simhadri |[src](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/benchmark/algorithms/diskann-t2.py) |[nb](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/EvalPublic.ipynb) | -|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |[6](#recall-or-ap-rankings) |[6](#throughput-rankings) |[5](#power-rankings) |[5](#cost-rankings) |final |0/58 |George Williams |[src](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/benchmark/algorithms/faiss_t3.py) 
|[nb](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/EvalPublic.ipynb) | -|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |[4](#recall-or-ap-rankings) |[4](#throughput-rankings) |[4](#power-rankings) |[4](#cost-rankings) |final |0/60 |George Williams |[src](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/benchmark/algorithms/gemini.py) |[nb](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/EvalPublic.ipynb) | -|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |[3](#recall-or-ap-rankings) |[3](#throughput-rankings) |[1](#power-rankings) |[2](#cost-rankings)\*\* |final |[5/50](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/ANOMALIES.md) |George Williams |[src](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/benchmark/algorithms/cuanns_ivfpq.py) |[nb](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/EvalPublic.ipynb) | -|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |[5](#recall-or-ap-rankings) |[1](#throughput-rankings) |[3](#power-rankings) |[3](#cost-rankings)\*\* |final |[4/40](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/ANOMALIES.md) |George Williams |[src](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/benchmark/algorithms/cuanns_multigpu.py) |[nb](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/EvalPublic.ipynb) | -|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md)|Intel |Intel Optane |[2](#recall-or-ap-rankings) |[2](#throughput-rankings) |[2](#power-rankings) 
|[1](#cost-rankings)|final |[5/50](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/ANOMALIES.md) |George Williams |[src](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/benchmark/algorithms/graphann.py) |[nb](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/EvalPublic.ipynb)| - -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - * *NQ* = not qualified - * *NA* = data is not yet available, or has not yet been processed - -* *Anomalies* are defined as queries that could potentially be the result of query response caching, a violation of the competition. Our detection method looks for a 30% or more improvement in the batch query latency between the first and last query of a query group (5). Participants have been given a chance to explain why detected anomalies (if any) are not a result of query response caching. - -* \*\*Nvidia has not yet approved the MSRP cost used for ranking, so participation in this benchmark is still pending. 
- -### Rankings Per Metric - -#### Recall Or AP Rankings - -|Rank|Submission |Team |Hardware|Status |Score |[Deep1B](#deep1B-recall-rankings)|[BigANN](#bigann-recall-rankings)|[MSTuring](#msturing-recall-rankings)|[MSSpace](#msspace-recall-rankings)|[Text2Image](#text2image-recall-rankings)|[FBSSNet](#fbsimsearchnet-ap-rankings)| -|----|------------------|-------|--------|-------|-----------|------|------|--------|-------|----------|-------| -| 1|[diskann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/diskann-bare-metal/README.md)|Microsoft Research India(*org*)|Dell PowerEdge |final|**0.410**|[0.99821](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/deep-1B_recall.png) |[0.99976](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/bigann-1B_recall.png) |[0.99444](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/msturing-1B_recall.png) |[0.99342](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/msspacev-1B_recall.png) |[0.98130](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/text2image-1B_recall.png) |- | -| 2|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md)|Intel|Intel Optane |final|**0.409**|[0.99882](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/deep-1B_recall.png) |[0.99978](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/bigann-1B_recall.png) |[0.99568](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/msturing-1B_recall.png) |[0.99835](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/msspacev-1B_recall.png) 
|[0.97340](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/text2image-1B_recall.png) |- | -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md)|NVidia|NVidia GPU |final|**0.368**|[0.99541](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/deep-1B_recall.png) |[0.99882](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/bigann-1B_recall.png) |[0.98993](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/msturing-1B_recall.png) |[0.99428](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/msspacev-1B_recall.png) |[0.94691](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/text2image-1B_recall.png) |- | -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md)|GSI Technology(*org*)|LedaE APU |final|**0.339**|[0.99208](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/deep-1B_recall.png) |[0.99328](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/bigann-1B_recall.png) |[0.97841](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/msturing-1B_recall.png) |[0.98622](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/msspacev-1B_recall.png) |[0.92855](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/text2image-1B_recall.png) |[0.99684](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/ssnpp-1B_recall.png) | -| 5|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md)|NVidia|NVidia GPU 
|final|**0.166**|[0.95736](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/deep-1B_recall.png) |[0.96750](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/bigann-1B_recall.png) |[0.96286](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/msturing-1B_recall.png) |[0.97541](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/msspacev-1B_recall.png) |- |- | -| 6|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md)|Facebook Research(*org*)|NVidia GPU |final|**baseline**|[0.94275](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/deep-1B_recall.png) |[0.93260](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/bigann-1B_recall.png) |[0.91322](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/msturing-1B_recall.png) |[0.90853](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/msspacev-1B_recall.png) |[0.86028](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/text2image-1B_recall.png) |[0.97863](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/ssnpp-1B_recall.png) | - -* A submission must support at least 3 databases to qualify for this ranking. -* The ranking is based on the score, which is the sum of benchmark improvements of qualifying databases (shown in specific database columns after the score column.) 
-* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - -#### Throughput Rankings - -|Rank|Submission |Team |Hardware|Status |Score |[Deep1B](#deep1B-throughput-rankings)|[BigANN](#bigann-throughput-rankings)|[MSTuring](#msturing-throughput-rankings)|[MSSpace](#msspace-throughput-rankings)|[Text2Image](#text2image-throughput-rankings)|[FBSSNet](#fbsimsearchnet-throughput-rankings)| -|----|------------------|-------|--------|-------|-----------|------|------|--------|-------|----------|--------------| -| 1|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md)|NVidia|NVidia GPU |final|**3001623.821**|[816,807](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/deep-1B_throughput.png) |[767,653](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/bigann-1B_throughput.png) |[586,722](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/msturing-1B_throughput.png) |[844,287](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/msspacev-1B_throughput.png) |- |- | -| 2|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md)|Intel|Intel Optane |final|**851327.044**|[196,546](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/deep-1B_throughput.png) |[335,991](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/bigann-1B_throughput.png) |[161,463](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/msturing-1B_throughput.png) 
|[155,899](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/msspacev-1B_throughput.png) |[17,063](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/text2image-1B_throughput.png) |- | -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md)|NVidia|NVidia GPU |final|**401541.475**|[91,938](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/deep-1B_throughput.png) |[85,446](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/bigann-1B_throughput.png) |[110,830](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/msturing-1B_throughput.png) |[109,621](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/msspacev-1B_throughput.png) |[19,340](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/text2image-1B_throughput.png) |- | -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md)|GSI Technology(*org*)|LedaE APU |final|**52429.395**|[10,704](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/deep-1B_throughput.png) |[10,672](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/bigann-1B_throughput.png) |[21,780](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/msturing-1B_throughput.png) |[16,422](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/msspacev-1B_throughput.png) |[4,838](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/text2image-1B_throughput.png) |[9,345](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/ssnpp-1B_throughput.png) | -| 
5|[diskann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/diskann-bare-metal/README.md)|Microsoft Research India(*org*)|Dell PowerEdge |final|**49398.127**|[12,927](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/deep-1B_throughput.png) |[19,094](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/bigann-1B_throughput.png) |[17,201](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/msturing-1B_throughput.png) |[6,503](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/msspacev-1B_throughput.png) |[9,307](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/text2image-1B_throughput.png) |- | -| 6|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md)|Facebook Research(*org*)|NVidia GPU |final|**baseline**|[4,464](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/deep-1B_throughput.png) |[3,271](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/bigann-1B_throughput.png) |[2,845](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/msturing-1B_throughput.png) |[3,265](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/msspacev-1B_throughput.png) |[1,789](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/text2image-1B_throughput.png) |[5,699](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/ssnpp-1B_throughput.png) | - -* A submission must support at least 3 databases to qualify for this ranking. -* The ranking is based on the score, which is the sum of benchmark improvements of qualifying databases (shown in specific database columns after the score column.) 
-* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - -#### Power Rankings - -|Rank|Submission |Team |Hardware|Status |Score |[Deep1B](#deep1B-power-rankings)|[BigANN](#bigann-power-rankings)|[MSTuring](#msturing-power-rankings)|[MSSpace](#msspace-power-rankings)|[Text2Image](#text2image-power-rankings)|[FBSSNet](#fbsimsearchnet-power-rankings)| -|----|------------------|-------|--------|-------|-----------|------|------|--------|-------|-----|-----| -| 1|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md)|NVidia|NVidia GPU |final|**-0.691**|[0.0024](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/deep-1B_power.png) |[0.0023](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/bigann-1B_power.png) |[0.0016](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/msturing-1B_power.png) |[0.0017](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/msspacev-1B_power.png) |[0.0094](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/text2image-1B_power.png)|-| -| 2|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md)|Intel|Intel Optane |final|**-0.648**|[0.0041](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/deep-1B_power.png) |[0.0022](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/bigann-1B_power.png) |[0.0048](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/msturing-1B_power.png)
|[0.0050](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/msspacev-1B_power.png) |[0.0446](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/text2image-1B_power.png)|-| -| 3|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md)|NVidia|NVidia GPU |final|**-0.594**|[0.0002](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/deep-1B_power.png) |[0.0003](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/bigann-1B_power.png) |[0.0004](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/msturing-1B_power.png) |[0.0002](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/msspacev-1B_power.png) |-|-| -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md)|GSI Technology(*org*)|LedaE APU |final|**-0.513**|[0.0337](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/deep-1B_power.png) |[0.0341](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/bigann-1B_power.png) |[0.0236](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/msturing-1B_power.png) |[0.0230](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/msspacev-1B_power.png) |[0.1242](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/text2image-1B_power.png)|[0.0469](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/ssnpp-1B_power.png)| -| 5|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md)|Facebook Research(*org*)|NVidia GPU
|final|**baseline**|[0.1117](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/deep-1B_power.png) |[0.1576](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/bigann-1B_power.png) |[0.1743](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/msturing-1B_power.png) |[0.1520](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/msspacev-1B_power.png) |[0.1128](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/text2image-1B_power.png)|[0.0904](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/ssnpp-1B_power.png)| -| 6|[-](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md)|-|- |-|**-**|- |- |- |- |-|-| - -* A submission must support at least 3 databases to qualify for this ranking. -* The ranking is based on the score, which is the sum of benchmark improvements of qualifying databases (shown in specific database columns after the score column.) 
-* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - -#### Cost Rankings - -|Rank|Submission |Team |Hardware|Status |Score |[Deep1B](#deep1B-cost-rankings)|[BigANN](#bigann-cost-rankings)|[MSTuring](#msturing-cost-rankings)|[MSSpace](#msspace-cost-rankings)|[Text2Image](#text2image-cost-rankings)|[FBSSNet](#fbsimsearchnet-cost-rankings)| -|----|------------------|-------|--------|-------|-----------|------|------|--------|-------|----------|--------------| -| 1|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md)|Intel|Intel Optane |final|**$-3,978,172.56**|$16,086.82 |$15,439.92 |$16,347.45 |$16,409.08 |$103,599.49 |- | -| 2|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md)|NVidia|NVidia GPU |final|**$-2,339,919.09\*\***|$300,843.83 |$300,815.92 |$150,563.49 |$150,605.68 |$903,307.30 |- | -| 3|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md)|NVidia|NVidia GPU |final|**$-2,272,942.67\*\***|$150,082.04 |$150,088.58 |$150,127.39 |$150,078.78 |- |- | -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md)|GSI Technology(*org*)|LedaE APU |final|**$-907,570.13**|$569,058.09 |$569,210.35 |$286,911.87 |$398,163.18 |$1,213,773.56 |$629,442.91 | -| 5|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md)|Facebook Research(*org*)|NVidia GPU |final|**baseline**|$545,633.16 |$737,886.17 |$853,857.46 |$735,942.66 |$1,272,735.86 |$428,074.79 | -| 6|[-](-)|-|- |-|**-**|- |- |- |- |- |- | - -* A submission must support at least 3 databases to qualify for this ranking. 
-* The ranking is based on the score, which is the sum of benchmark improvements of qualifying databases (shown in specific database columns after the score column.) -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - -* \*\*Nvidia has not yet approved the MSRP cost used for ranking, so participation in this benchmark is still pending. - -### Rankings Per Database - -#### Deep1B - -##### Deep1B Recall Rankings - -|Rank|Submission |Team |Hardware |Status |R@10 | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|-----------| -| 1|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |final|**[0.99882](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/deep-1B_recall.png)**| -| 2|[diskann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/diskann-bare-metal/README.md) |Microsoft Research India(*org*) |Dell PowerEdge |final|**[0.99821](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/deep-1B_recall.png)**| -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |final|**[0.99541](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/deep-1B_recall.png)**| -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**[0.99208](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/deep-1B_recall.png)**| -| 5|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia 
GPU |final|**[0.95736](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/deep-1B_recall.png)**| -| 6|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**[0.94275](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/deep-1B_recall.png)**| - -* The operational point for ranking is 2000 QPS. We will use the highest recall for the search parameters that meet or exceed 2000 QPS. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - -##### Deep1B Throughput Rankings - -|Rank|Submission |Team |Hardware |Status |Q/S | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|-----------| -| 1|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |final|**[816,807](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/deep-1B_throughput.png)**| -| 2|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |final|**[196,546](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/deep-1B_throughput.png)**| -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |final|**[91,938](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/deep-1B_throughput.png)**| -| 4|[diskann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/diskann-bare-metal/README.md) |Microsoft Research India(*org*) |Dell PowerEdge 
|final|**[12,927](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/deep-1B_throughput.png)**| -| 5|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**[10,704](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/deep-1B_throughput.png)**| -| 6|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**[4,464](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/deep-1B_throughput.png)**| - -* The operational point for ranking is 0.90 recall@10. We will use the highest throughput for the search parameters that meet or exceed 0.90 recall@10. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - -##### Deep1B Power Rankings - -|Rank|Submission |Team |Hardware |Status |W*S/Q | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|-----------| -| 1|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |final|**[0.0002](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/deep-1B_power.png)**| -| 2|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |final|**[0.0024](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/deep-1B_power.png)**| -| 3|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane 
|final|**[0.0041](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/deep-1B_power.png)**| -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**[0.0337](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/deep-1B_power.png)**| -| 5|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**[0.1117](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/deep-1B_power.png)**| -| 6|[-](-) |- |- |-|**-**| - -* The operational point for ranking is 0.90 recall@10. We will use the lowest power consumption for the search parameters that meet or exceed 0.90 recall@10. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - -##### Deep1B Cost Rankings - -|Rank|Submission |Team |Hardware |Status |Cost |capex |opex |unit cost|units@100K qps|KwH*4yrs | -|----|--------------------|---------|-----------------------|--------|-------------|--------|--------|---------|--------------|---------| -| 1|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md)|Intel |Intel Optane |final|**$16,086.82** |$14,664.20|$1,422.62|$14,664.20 |1 |14,226.208| -| 2|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md)|NVidia |NVidia GPU |final|**$150,082.04\*\*** |$150,000.00|$82.04|$150,000.00 |1 |820.405| -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md)|NVidia |NVidia GPU |final|**$300,843.83\*\*** |$300,000.00|$843.83|$150,000.00 |2 |8,438.315| -| 
4|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md)|Facebook Research(*org*) |NVidia GPU |final|**$545,633.16** |$506,503.70|$39,129.46|$22,021.90 |23 |391,294.584| -| 5|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md)|GSI Technology(*org*) |LedaE APU |final|**$569,058.09** |$557,266.60|$11,791.49|$55,726.66 |10 |117,914.908| -| 6|[-](-)|- |- |-|**-** |-|-|- |- |-| - -* The operational point for ranking is 0.90 recall@10. We will use the lowest power consumption/query for the search parameters that meet or exceed 0.90 recall@10. -* The formula is based on: - * Take the algorithm's throughput submitted to leaderboard, use it to scale no. of systems needed to scale to 100K qps (using ceiling to round up any decimal.) - * Capex = cost per system * scale no. - * Take w*s/q from algorithm's power metric submitted to leaderboard and convert to KwH/q. - * Multiply by total queries at 100K qps for 4 years = 4x365x24x60x60x100000 total queries - * Opex = (total queries over 4 years) * KwH/query * $0.10/KwH -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress -* \*\*Nvidia has not yet approved the MSRP cost used for ranking, so participation in this benchmark is still pending. 
- -#### BigANN - -##### BigANN Recall Rankings - -|Rank|Submission |Team |Hardware |Status |R@10 | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|-------------| -| 1|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |final|**[0.99978](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/bigann-1B_recall.png)** | -| 2|[diskann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/diskann-bare-metal/README.md) |Microsoft Research India(*org*) |Dell PowerEdge |final|**[0.99976](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/bigann-1B_recall.png)** | -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |final|**[0.99882](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/bigann-1B_recall.png)** | -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**[0.99328](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/bigann-1B_recall.png)** | -| 5|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |final|**[0.96750](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/bigann-1B_recall.png)** | -| 6|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**[0.93260](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/bigann-1B_recall.png)** | - -* The operational point for ranking is 2000 QPS. 
We will use the highest recall for the search parameters that meet or exceed 2000 QPS. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - -##### BigANN Throughput Rankings - -|Rank|Submission |Team |Hardware |Status |Q/S | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|-------------| -| 1|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |final|**[767,653](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/bigann-1B_throughput.png)** | -| 2|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |final|**[335,991](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/bigann-1B_throughput.png)** | -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |final|**[85,446](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/bigann-1B_throughput.png)** | -| 4|[diskann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/diskann-bare-metal/README.md) |Microsoft Research India(*org*) |Dell PowerEdge |final|**[19,094](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/bigann-1B_throughput.png)** | -| 5|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**[10,672](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/bigann-1B_throughput.png)** | -| 
6|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**[3,271](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/bigann-1B_throughput.png)** | - -* The operational point for ranking is 0.90 recall@10. We will use the highest throughput for the search parameters that meet or exceed 0.90 recall@10. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - -##### BigANN Power Rankings - -|Rank|Submission |Team |Hardware |Status |W*S/Q | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|-----------| -| 1|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |final|**[0.0003](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/bigann-1B_power.png)**| -| 2|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |final|**[0.0022](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/bigann-1B_power.png)**| -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |final|**[0.0023](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/bigann-1B_power.png)**| -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**[0.0341](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/bigann-1B_power.png)**| -| 
5|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**[0.1576](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/bigann-1B_power.png)**| -| 6|[-](-) |- |- |-|**-**| - -* The operational point for ranking is 0.90 recall@10. We will use the lowest power consumption for the search parameters that meet or exceed 0.90 recall@10. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - -##### BigANN Cost Rankings - -|Rank|Submission |Team |Hardware |Status |Cost |capex |opex |unit cost|units@100K qps|KwH*4yrs | -|----|--------------------|------------------------------|--------------------|--------|--------------|--------|--------|---------|--------------|---------| -| 1|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md)|Intel |Intel Optane |final|**$15,439.92** |$14,664.20|$775.72|$14,664.20 |1 |7,757.221| -| 2|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md)|NVidia |NVidia GPU |final|**$150,088.58\*\*** |$150,000.00|$88.58|$150,000.00 |1 |885.770| -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md)|NVidia |NVidia GPU |final|**$300,815.92\*\*** |$300,000.00|$815.92|$150,000.00 |2 |8,159.226| -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md)|GSI Technology(*org*) |LedaE APU |final|**$569,210.35** |$557,266.60|$11,943.75|$55,726.66 |10 |119,437.537| -| 5|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md)|Facebook Research(*org*) |NVidia GPU |final|**$737,886.17** |$682,678.90|$55,207.27|$22,021.90 |31 |552,072.703| -| 
6|[-](-)|- |- |-|**-** |-|-|- |- |-| - -* The operational point for ranking is 0.90 recall@10. We will use the lowest power consumption/query for the search parameters that meet or exceed 0.90 recall@10. -* The formula is based on: - * Take the algorithm's throughput submitted to leaderboard, use it to scale no. of systems needed to scale to 100K qps (using ceiling to round up any decimal.) - * Capex = cost per system * scale no. - * Take w*s/q from algorithm's power metric submitted to leaderboard and convert to KwH/q. - * Multiply by total queries at 100K qps for 4 years = 4x365x24x60x60x100000 total queries over 4 years. - * Opex = (total queries over 4 years) * KwH/query * $0.10/KwH -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress -* \*\*Nvidia has not yet approved the MSRP cost used for ranking, so participation in this benchmark is still pending. 
- -#### MSTuring - -##### MSTuring Recall Rankings - -|Rank|Submission |Team |Hardware |Status |R@10 | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|---------------| -| 1|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |final|**[0.99568](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/msturing-1B_recall.png)** | -| 2|[diskann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/diskann-bare-metal/README.md) |Microsoft Research India(*org*) |Dell PowerEdge |final|**[0.99444](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/msturing-1B_recall.png)** | -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |final|**[0.98993](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/msturing-1B_recall.png)** | -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**[0.97841](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/msturing-1B_recall.png)** | -| 5|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |final|**[0.96286](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/msturing-1B_recall.png)** | -| 6|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**[0.91322](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/msturing-1B_recall.png)** | - -* The operational point for ranking is 2000 QPS. 
We will use the highest recall for the search parameters that meet or exceed 2000 QPS. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - -##### MSTuring Throughput Rankings - -|Rank|Submission |Team |Hardware |Status |Q/S | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|------------| -| 1|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |final|**[586,722](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/msturing-1B_throughput.png)** | -| 2|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |final|**[161,463](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/msturing-1B_throughput.png)** | -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |final|**[110,830](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/msturing-1B_throughput.png)** | -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**[21,780](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/msturing-1B_throughput.png)** | -| 5|[diskann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/diskann-bare-metal/README.md) |Microsoft Research India(*org*) |Dell PowerEdge |final|**[17,201](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/msturing-1B_throughput.png)** | -| 
6|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**[2,845](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/msturing-1B_throughput.png)** | - -* The operational point for ranking is 0.90 recall@10. We will use the highest throughput for the search parameters that meet or exceed 0.90 recall@10. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - -##### MSTuring Power Rankings - -|Rank|Submission |Team |Hardware |Status|W*S/Q | -|----|-------------------------------------------------------|------------------------------|-----------------------|------|--------------| -| 1|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |final|**[0.0004](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/msturing-1B_power.png)** | -| 2|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |final|**[0.0016](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/msturing-1B_power.png)** | -| 3|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |final|**[0.0048](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/msturing-1B_power.png)** | -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**[0.0236](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/msturing-1B_power.png)** | -| 
5|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**[0.1743](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/msturing-1B_power.png)** | -| 6|[-](-) |- |- |-|**-** | - -* The operational point for ranking is 0.90 recall@10. We will use the lowest power consumption for the search parameters that meet or exceed 0.90 recall@10. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - -##### MSTuring Cost Rankings - -|Rank|Submission |Team |Hardware |Status |Cost |capex |opex |unit cost|units@100K qps|KwH*4yrs | -|----|------------------------------------|------------------------------|-----------------------|--------|--------------|--------|--------|---------|--------------|----------| -| 1|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |final|**$16,347.45** |$14,664.20|$1,683.25|$14,664.20 |1 |16,832.451 | -| 2|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |final|**$150,127.39\*\*** |$150,000.00|$127.39|$150,000.00 |1 |1,273.870 | -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |final|**$150,563.49\*\*** |$150,000.00|$563.49|$150,000.00 |1 |5,634.885 | -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**$286,911.87** |$278,633.30|$8,278.57|$55,726.66 |5 |82,785.683 | -| 5|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**$853,857.46** 
|$792,788.40|$61,069.06|$22,021.90 |36 |610,690.611 | -| 6|[-](-) |- |- |-|**-** |-|-|- |- |- | - -* The operational point for ranking is 0.90 recall@10. We will use the lowest power consumption/query for the search parameters that meet or exceed 0.90 recall@10. -* The formula is based on: - * Take the algorithm's throughput submitted to leaderboard, use it to scale no. of systems needed to scale to 100K qps (using ceiling to round up any decimal.) - * Capex = cost per system * scale no. - * Take w*s/q from algorithm's power metric submitted to leaderboard and convert to KwH/q. - * Multiply by total queries at 100K qps for 4 years = 4x365x24x60x60x100000 total queries over 4 years. - * Opex = (total queries over 4 years) * KwH/query * $0.10/KwH -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress -* \*\*Nvidia has not yet approved the MSRP cost used for ranking, so participation in this benchmark is still pending. 
- -#### MSSpace - -##### MSSpace Recall Rankings - -|Rank|Submission |Team |Hardware |Status |R@10 | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|---------| -| 1|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |final|**[0.99835](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/msspacev-1B_recall.png)** | -| 2|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |final|**[0.99428](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/msspacev-1B_recall.png)** | -| 3|[diskann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/diskann-bare-metal/README.md) |Microsoft Research India(*org*) |Dell PowerEdge |final|**[0.99342](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/msspacev-1B_recall.png)** | -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**[0.98622](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/msspacev-1B_recall.png)** | -| 5|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |final|**[0.97541](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/msspacev-1B_recall.png)** | -| 6|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**[0.90853](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/msspacev-1B_recall.png)** | - -* The operational point for ranking is 2000 QPS.
We will use the highest recall for the search parameters that meet or exceed 2000 QPS. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - -##### MSSpace Throughput Rankings - -|Rank|Submission |Team |Hardware |Status |Q/S | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|------------| -| 1|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |final|**[844,287](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/msspacev-1B_throughput.png)** | -| 2|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |final|**[155,899](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/msspacev-1B_throughput.png)** | -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |final|**[109,621](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/msspacev-1B_throughput.png)** | -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**[16,422](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/msspacev-1B_throughput.png)** | -| 5|[diskann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/diskann-bare-metal/README.md) |Microsoft Research India(*org*) |Dell PowerEdge |final|**[6,503](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/msspacev-1B_throughput.png)** | -| 
6|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**[3,265](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/msspacev-1B_throughput.png)** | - -* The operational point for ranking is 0.9 recall@10. We will use the highest throughput for the search parameters that meet or exceed 0.9 recall@10. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - -##### MSSpace Power Rankings - -|Rank|Submission |Team |Hardware |Status |W*S/Q | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|------------| -| 1|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md) |NVidia |NVidia GPU |final|**[0.0002](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_multigpu/msspacev-1B_power.png)** | -| 2|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |final|**[0.0017](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/msspacev-1B_power.png)** | -| 3|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |final|**[0.0050](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/msspacev-1B_power.png)** | -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**[0.0230](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/msspacev-1B_power.png)** | -| 
5|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**[0.1520](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/msspacev-1B_power.png)** | -| 6|[-](-) |- |- |-|**-** | - -* The operational point for ranking is 0.9 recall@10. We will use the lowest power consumption for the search parameters that meet or exceed 0.9 recall@10. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - -##### MSSpace Cost Rankings - -|Rank|Submission |Team |Hardware |Status |Cost |capex |opex |unit cost|units@100K qps|KwH*4yrs | -|----|--------------------|------------------------------|-----------------------|------- |--------------|--------|--------|---------|--------------|----------| -| 1|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md)|Intel |Intel Optane |final|**$16,409.08** |$14,664.20|$1,744.88|$14,664.20 |1 |17,448.764 | -| 2|[cuanns_multigpu](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_multigpu/README.md)|NVidia |NVidia GPU |final|**$150,078.78\*\*** |$150,000.00|$78.78|$150,000.00 |1 |787.774 | -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md)|NVidia |NVidia GPU |final|**$150,605.68\*\*** |$150,000.00|$605.68|$150,000.00 |1 |6,056.841 | -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md)|GSI Technology(*org*) |LedaE APU |final|**$398,163.18** |$390,086.62|$8,076.56|$55,726.66 |7 |80,765.638 | -| 5|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md)|Facebook Research(*org*) |NVidia GPU |final|**$735,942.66** |$682,678.90|$53,263.76|$22,021.90 |31 
|532,637.584 | -| 6|[-](-)|- |- |-|**-** |-|-|- |- |- | - -* The operational point for ranking is 0.90 recall@10. We will use the lowest power consumption/query for the search parameters that meet or exceed 0.90 recall@10. -* The formula is based on: - * Take the algorithm's throughput submitted to leaderboard, use it to scale no. of systems needed to scale to 100K qps (using ceiling to round up any decimal.) - * Capex = cost per system * scale no. - * Take w*s/q from algorithm's power metric submitted to leaderboard and convert to KwH/q. - * Multiply by total queries at 100K qps for 4 years = 4x365x24x60x60x100000 total queries over 4 years. - * Opex = (total queries over 4 years) * KwH/query * $0.10/KwH -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress -* \*\*Nvidia has not yet approved the MSRP cost used for ranking, so participation in this benchmark is still pending. 
- -#### Text2Image - -##### Text2Image Recall Rankings - -|Rank|Submission |Team |Hardware |Status |R@10 | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|-------------| -| 1|[diskann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/diskann-bare-metal/README.md) |Microsoft Research India(*org*) |Dell PowerEdge |final|**[0.98130](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/text2image-1B_recall.png)** | -| 2|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |final|**[0.97340](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/text2image-1B_recall.png)** | -| 3|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |final|**[0.94691](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/text2image-1B_recall.png)** | -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**[0.92855](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/text2image-1B_recall.png)** | -| 5|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**[0.86028](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/text2image-1B_recall.png)** | -| 6|[-](-) |- |- |-|**-** | - -* The operational point for ranking is 2000 QPS. We will use the highest recall for the search parameters that meet or exceed 2000 QPS. 
-* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - -##### Text2Image Throughput Rankings - -|Rank|Submission |Team |Hardware |Status |Q/S | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|------------| -| 1|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |final|**[19,340](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/text2image-1B_throughput.png)** | -| 2|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |final|**[17,063](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/text2image-1B_throughput.png)** | -| 3|[diskann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/diskann-bare-metal/README.md) |Microsoft Research India(*org*) |Dell PowerEdge |final|**[9,307](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/diskann-bare-metal/text2image-1B_throughput.png)** | -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**[4,838](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/text2image-1B_throughput.png)** | -| 5|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**[1,789](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/text2image-1B_throughput.png)** | -| 6|[-](-) |- |- |-|**-** | - -* The operational point for ranking is 0.860 recall@10. 
We will use the highest throughput for the search parameters that meet or exceed 0.860 recall@10. -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - -##### Text2Image Power Rankings - -|Rank|Submission |Team |Hardware |Status |W*S/Q | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|-----------| -| 1|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |final|**[0.0094](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/cuanns_ivfpq/text2image-1B_power.png)**| -| 2|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |final|**[0.0446](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/optanne_graphann/text2image-1B_power.png)**| -| 3|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**[0.1128](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/text2image-1B_power.png)**| -| 4|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**[0.1242](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/text2image-1B_power.png)**| -| 5|[-](-) |- |- |-|**-**| -| 6|[-](-) |- |- |-|**-**| - -* The operational point for ranking is 0.86 recall@10. We will use the lowest power consumption for the search parameters that meet or exceed 0.86 recall@10. 
-* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - -##### Text2Image Cost Rankings - -|Rank|Submission |Team |Hardware |Status |Cost |capex |opex |unit cost|units@100K qps|KwH*4yrs | -|----|---------------------|------------------------------|---------------------|--------|--------------|--------|--------|---------|--------------|---------| -| 1|[optanne_graphann](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/optanne_graphann/README.md) |Intel |Intel Optane |final|**$103,599.49** |$87,985.20|$15,614.29|$14,664.20 |6 |156,142.873| -| 2|[cuanns_ivfpq](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/cuanns_ivfpq/README.md) |NVidia |NVidia GPU |final|**$903,307.30\*\*** |$900,000.00|$3,307.30|$150,000.00 |6 |33,072.963| -| 3|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**$1,213,773.56** |$1,170,259.86|$43,513.70|$55,726.66 |21 |435,137.010| -| 4|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**$1,272,735.86** |$1,233,226.40|$39,509.46|$22,021.90 |56 |395,094.625| -| 5|[-](-) |- |- |-|**-** |-|-|- |- |-| -| 6|[-](-) |- |- |-|**-** |-|-|- |- |-| - -* The operational point for ranking is 0.86 recall@10. We will use the lowest power consumption/query for the search parameters that meet or exceed 0.86 recall@10. -* The formula is based on: - * Take the algorithm's throughput submitted to leaderboard, use it to scale no. of systems needed to scale to 100K qps (using ceiling to round up any decimal.) - * Capex = cost per system * scale no. - * Take w*s/q from algorithm's power metric submitted to leaderboard and convert to KwH/q. 
- * Multiply by total queries at 100K qps for 4 years = 4x365x24x60x60x100000 total queries over 4 years. - * Opex = (total queries over 4 years) * KwH/query * $0.10/KwH -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress -* \*\*Nvidia has not yet approved the MSRP cost used for ranking, so participation in this benchmark is still pending. - -#### FBSimSearchNet - -##### FBSimSearchNet AP Rankings - -|Rank|Submission |Team |Hardware |Status |AP | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|-------------| -| 1|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**[0.99684](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/ssnpp-1B_recall.png)** | -| 2|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**[0.97863](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/ssnpp-1B_recall.png)** | -| 3|[-](-) |- |- |-|**-** | -| 4|[-](-) |- |- |-|**-** | -| 5|[-](-) |- |- |-|**-** | -| 6|[-](-) |- |- |-|**-** | - -* The operational point for ranking is 2000 QPS. We will use the highest recall for the search parameters that meet or exceed 2000 QPS. 
-* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - -##### FBSimSearchNet Throughput Rankings - -|Rank|Submission |Team |Hardware |Status |Q/S | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|------------| -| 1|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**[9,345](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/ssnpp-1B_throughput.png)** | -| 2|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**[5,699](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/ssnpp-1B_throughput.png)** | -| 3|[-](-) |- |- |-|**-** | -| 4|[-](-) |- |- |-|**-** | -| 5|[-](-) |- |- |-|**-** | -| 6|[-](-) |- |- |-|**-** | - -* The operational point for ranking is 0.9 recall@10. We will use the highest throughput for the search parameters that meet or exceed 0.9 average precision. 
-* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - - -##### FBSimSearchNet Power Rankings - -|Rank|Submission |Team |Hardware |Status |W*S/Q | -|----|-------------------------------------------------------|------------------------------|-----------------------|--------|-----------| -| 1|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md) |GSI Technology(*org*) |LedaE APU |final|**[0.0469](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/gemini/ssnpp-1B_power.png)**| -| 2|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md) |Facebook Research(*org*) |NVidia GPU |final|**[0.0904](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/eval_2021/faiss_t3/ssnpp-1B_power.png)**| -| 3|[-](-) |- |- |-|**-**| -| 4|[-](-) |- |- |-|**-**| -| 5|[-](-) |- |- |-|**-**| -| 6|[-](-) |- |- |-|**-**| - -* The operational point for ranking is 0.9 recall@10. We will use the lowest power consumption for the search parameters that meet or exceed 0.9 average precision. 
-* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress - -##### FBSimSearchNet Cost Rankings - -|Rank|Submission |Team |Hardware |Status |Cost |capex |opex |unit cost|units@100K qps|KwH*4yrs | -|----|--------------------|------------------------------|---------------------|--------|--------------|--------|--------|---------|--------------|---------| -| 1|[faiss_t3](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/faiss_t3/README.md)|Facebook Research(*org*) |NVidia GPU |final|**$428,074.79** |$396,394.20|$31,680.59|$22,021.90 |18 |316,805.859| -| 2|[gemini](https://github.com/harsha-simhadri/big-ann-benchmarks/blob/gw/T3/t3/gemini/README.md)|GSI Technology(*org*) |LedaE APU |final|**$629,442.91** |$612,993.26|$16,449.65|$55,726.66 |11 |164,496.451| -| 3|[-](-)|- |- |-|**-** | -| -| -| -| -| -| 4|[-](-)|- |- |-|**-** | -| -| -| -| -| - -* The operational point for ranking is 0.9 recall@10. We will use the lowest power consumption/query for the search parameters that meet or exceed 0.9 recall@10. -* The formula is based on: - * Take the algorithm's throughput submitted to leaderboard, use it to scale no. of systems needed to scale to 100K qps (using ceiling to round up any decimal.) - * Capex = cost per system * scale no. - * Take w*s/q from algorithm's power metric submitted to leaderboard and convert to KwH/q. - * Multiply by total queries at 100K qps for 4 years = 4x365x24x60x60x100000 total queries over 4 years. - * Opex = (total queries over 4 years) * KwH/query * $0.10/KwH -* Abbreviations used in chart: - * *org* = submitted by challenge organizer, so subject to competition restrictions - * *final* = final submission - * *inprog* = algorithm development still in progress -* \*\*Nvidia has not yet approved the MSRP cost used for ranking, so participation in this benchmark is still pending. 
diff --git a/t3/RANKING.md b/t3/RANKING.md deleted file mode 100644 index 1d8bc88c9..000000000 --- a/t3/RANKING.md +++ /dev/null @@ -1,196 +0,0 @@ -# Explanation of T3 Ranking Method - -This readme outlines the ranking logic used for the T3 track of this competition. - -## Benchmarks - -We measure participants on 4 benchmarks and we maintain a leaderboard for each: -* recall/average precision - recall is based on recall@10 accounting for distance ties -* throughput - based on queries/second -* power consumption - based on measuring watt*seconds/query -* cost - based on a projection of capex + opex - -## Ranking Score - -For each benchmark/leaderboard, we will compute an aggregate score based on the teams's performance on each participating dataset. - -A team must participate in at least 3 datasets to qualify for the competition. - -A team fails to qualify for a dataset if either 1) their algorithm does not support that dataset 2) the performance of their algorithm does not meet the threshold for that dataset (see below) for a benchmark that implements thresholds. - -The score on each participating dataset is based on the difference between the team's performance on that dataset and the performance of the baseline (see below). - -The team's final ranking score for a benchmark is the sum of individual participating dataset scores. - -In this way, teams that participate in more datasets can get an advantage. - -## Thresholds - -We implement thresholds for the recall/average precision and throughput benchmark/leaderboards. - -The thresholds are listed below for each dataset: - -|Dataset |R@10/AP |Throughput(qps) | -|-------------------|-----------|----------------| -|deep-1B |0.9 |2000 | -|bigann-1B |0.9 |2000 | -|msturing-1B |0.9 |2000 | -|msspacev-1B |0.0 |2000 | -|text2image-1B |0.86 |1762.363 | -|ssnpp-1B |0.9 |2000 | - -## Thresholds Explained - -We had to decide very early in the planning of this competition reasonable performance thresholds to implement. 
- -We observed that the performance of the T3 baseline algorithm (see below) was achieving at least 90% recall@10 at 2000qps for several datasets, so we decided to bake this into the competition rules. As our internal testing evolved we discovered that 1 dataset (text2image-1B) could not achieve those thresholds, and so we decided to lower the threshold based on the baseline performance we observed at that time. - -# Baseline - -## Algorithm and Hardware - -The baseline algorithm is based on FAISS library version 1.7.1. The FAISS library provides several ANN approaches and the baseline leverages the FAISS index called "IVF1048576,SQ8." The choice of this index was based on experimentation and consultation with Matthijs Douze of Facebook, one of the competition organizers. You can view the algorithm [here]. - -The hardware is 1 PCIe V100 NVidia GPU attached to an Advantech SKY motherboard with 768 GB RAM. More details about the hardware can be found [here](faiss_t3/README.md). - -## Threshold - -The baseline algorithm informed the track thresholds as explained in the Thresholds section above. - -## Scoring - -The performance of the baseline algorithm factors into the scoring used to rank participants, as explained in the Ranking Score section above. - -The benchmarks used in the score calculation are listed below for each dataset: - -|Dataset |Recall@10/AP|Throughput(qps) |Power(wspq) | -|-------------------|------------|----------------|-----------| -|deep-1B |0.943 |4417.036 |0.113 | -|bigann-1B |0.927 |3086.656 |0.167 | -|msturing-1B |0.909 |2359.485 |0.204 | -|msspacev-1B |0.909 |2770.848 |0.167 | -|text2image-1B |0.860 |1762.363 |0.123 | -|ssnpp-1B |0.979 |5572.272 |0.095 | - -## Measurements - -The baseline benchmarks are based on the most recent measurements. At the start, and during the competition, we had published different numbers. The reasons for the changes are described in [Appendix A](#appendix-a) below. 
- -# Appendix - -## Appendix A - -At the start of the competition, we had released the following thresholds: - -|Dataset |R@10/AP |Throughput(qps) | -|-------------------|-----------|----------------| -|deep-1B |0.9 |2000 | -|bigann-1B |0.9 |2000 | -|msturing-1B |0.9 |2000 | -|msspacev-1B |0.85 |1484.217 | -|text2image-1B |0.86 |1510.624 | -|ssnpp-1B |0.9 |2000 | - -The most recent thresholds have changed from the original for the following reasons: -* Changes in how recall was computed to deal with ties in distance. -* Changes in the radius for the range search dataset. -* Also we decided to re-run the measurements of the baseline algorithm on the T3 baseline machine using the current evaluation framework. The original baselines were measured using a different software framework. -* The original baselines published did not calculate and report baseline cost. - -The original baselines that were published are shown below. For recall: - -| dataset | qps | recall@10 | -| ------------ | -------- | --------- | -| msturing-1B | 2011.542 | 0.910 | -| bigann-1B | 2058.950 | 0.927 | -| text2image-1B| 2120.635 | 0.860 | -| deep-1B | 2002.490 | 0.942 | -| msspacev-1B | 2190.829 | 0.850 | - -And for throughput: - -| dataset | qps | recall@10 | -| ------------ | -------- | --------- | -| msturing-1B | 2421.856 | 0.902 | -| bigann-1B | 2186.755 | 0.905 | -| text2image-1B| 1510.624 | 0.882 | -| deep-1B | 3422.473 | 0.916 | -| msspacev-1B | 1484.217 | 0.869 | - -The following tables show the baseline performance on the range search dataset: - -Instead of recall, the range search dataset utilizes average precision: - -| dataset | qps | ap | -| -----------| ---------| --------- | -| ssnpp-1B | 2907.414 | 0.979 | - -For throughput: - -| dataset | qps | ap | -| -----------| -------- | --------- | -| ssnpp-1B | 5572.272 | 0.910 | - -Here were the published baselines for power: - -| dataset | power(wspq) | -| ------------ | ------------| -| msturing-1B | 0.203740 | -| bigann-1B | 0.167123 | -| 
text2image-1B| 0.089675 | -| deep-1B | 0.112581 | -| msspacev-1B | 0.099569 | -| ssnpp-1B | 0.0944865 | - - -The following table lists the full measurements for baseline performance experiments that informed the original baselines (only recall and throughput are shown.) - -| dbase| throughtput(qps)| recall@10| -|-------------------|--------------------|---------------------| -| bigann-1B| 2186.754570| 0.904860| -| bigann-1B| 1926.901416| 0.911140| -| bigann-1B| 1657.226695| 0.919860| -| bigann-1B| 2058.950046| 0.926560| -| bigann-1B| 1931.042641| 0.932450| -| bigann-1B| 1770.748406| 0.937190| -| bigann-1B| 1609.052224| 0.941330| -| bigann-1B| 1504.748288| 0.943890| -| text2image-1B| 2607.779941| 0.834820| -| text2image-1B| 2456.621393| 0.841845| -| text2image-1B| 2285.966847| 0.851920| -| text2image-1B| 2120.635218| 0.860156| -| text2image-1B| 1917.445903| 0.867244| -| text2image-1B| 1748.662912| 0.873469| -| text2image-1B| 1612.313130| 0.878757| -| text2image-1B| 1510.624227| 0.882487| -| msspacev-1B| 2465.473370| 0.844805| -| msspacev-1B| 2190.828587| 0.850205| -| msspacev-1B| 1935.385102| 0.854864| -| msspacev-1B| 1931.506970| 0.858998| -| msspacev-1B| 1748.525911| 0.862437| -| msspacev-1B| 1585.766679| 0.865152| -| msspacev-1B| 1477.389358| 0.867912| -| msspacev-1B| 1484.216732| 0.868812| -| msturing-1B| 3625.040250| 0.881202| -| msturing-1B| 3197.403722| 0.888140| -| msturing-1B| 2907.993722| 0.893669| -| msturing-1B| 2655.951474| 0.898400| -| msturing-1B| 2421.855941| 0.902413| -| msturing-1B| 2233.241641| 0.905846| -| msturing-1B| 2070.942269| 0.908949| -| msturing-1B| 2011.542149| 0.910115| -| deep-1B| 3422.472565| 0.915540| -| deep-1B| 2732.133452| 0.920430| -| deep-1B| 2507.486404| 0.927790| -| deep-1B| 1992.323615| 0.932950| -| deep-1B| 2037.783443| 0.937940| -| deep-1B| 2002.489712| 0.941740| -| deep-1B| 1967.826369| 0.945130| -| deep-1B| 1874.898854| 0.947430| - -These baseline numbers were performed on the machine configuration used for the T3 faiss 
baseline. - -An older (now obsolete) code framework was used to determine these thresholds, not the existing evaluation framework so unfortunately there is no algos.yaml configuration file. - - - diff --git a/t3/README.md b/t3/README.md deleted file mode 100644 index 0f9969c50..000000000 --- a/t3/README.md +++ /dev/null @@ -1,355 +0,0 @@ -# T3 Track - -## Table Of Contents - -- [Introduction](#introduction) -- [For Participants](#for_participants) - - [Getting Started](#getting_started) - - [Starting Your Development](#starting_your_development) - - [Developing Your Dockerfile](#developing_your_dockerfile) - - [Developing Your Algorithm](#developing_your_algorithm) - - [Submitting Your Algorithm](#submitting_your_algorithm) - - [How To Get Help](#how_to_get_help) - - [Leaderboard Ranking](#leaderboard_ranking) - - [Baseline Performance](#baseline_performance) - - [Recall/Average Precision Leaderboard](#recall/average_precision_leaderboard) - - [Throughput Leaderboard](#throughput_leaderboard) - - [Power Leaderboard](#power_leaderboard) - - [Cost Leaderboard](#cost_leaderboard) -- [For Evaluators](#for_organizers) - - [Evaluating Participant Algorithms](#evaluating_participant_algorithms) - - [Participant Sends Hardware To Evaluators](#participant_sends_hardware_to_organizers) - - [Participant Gives Remote Access To Evaluators](#participant_gives_remote_access_to_organizer) - - [Participant Runs And Submits Benchmarks](#participant_runs_and_submits_benchmark) - - [Evaluating Power Consumption](#evaluating_power_consumption) - -## Introduction - -The T1 and T2 tracks of the competition restrict the evaluation of algorithms to standard Azure CPU servers with 64GB of RAM and 2TB of SSD. The only restriction in the T3 track is that the evaluation machine can be any hardware that is commercially available ( including any commercially available add-on PCIe boards ). 
T3 will maintain four leaderboards: -* One based on recall/average precision -* One based on throughput -* One based on power consumption -* One based on hardware cost - -You can see the latest leaderboards' status [here](LEADERBOARDS.md). - -Participants must submit their algorithm via a pull request and index file(s) upload (one per participating dataset). Participants are not required to submit proprietary source code such as software drivers or firmware. - -Competition evaluators will evaluate the participant's algorithm and hardware via one of these options: -* Participants send their hardware to the organizers at the participant's expense. -* Participants give organizers remote access to the hardware. -* Participants run the evaluation benchmarks on their own, and send the results to the organizers. - -## For_Participants - -### Requirements - -You will need the following installed on your machine: -* Python ( we tested with Anaconda using an environment created for Python version 3.8.5 ) -* Note that we tested everything on Ubuntu Linux 18.04 but other environments should be possible. -* It's assumed that all the software drivers and services needed to support your hardware are installed on development machines. For example, to run the T3 baseline, your system must have a Cuda 11 compatible GPU, Cuda 11.0, and the cuda 11.0 docker run-time installed. See the T3 baseline [installation instructions](faiss_t3/README.md). Cuda versions greater than 11.0 should be possible, but weren't tested. - -### Getting_Started - -This section will present a small tutorial about how to use this framework and several of the key scripts you will use throughout the development of your algorithm and eventual submission. 
- -First, clone this repository and cd into the project directory: -``` -git clone -``` -Install the python package requirements: -``` -pip install -r requirements.txt -``` -Create a small, sample dataset: -``` -python create_dataset.py --dataset random-xs -``` -Build the docker container for the T3 baseline: -``` -python install.py --dockerfile t3/faiss_t3/Dockerfile -``` -Run a benchmark evaluation using the algorithm's definition file: -``` -python run.py --t3 --definitions t3/faiss_t3/algos.yaml --dataset random-xs -``` -Please note that the *--t3* flag is important. - -Now analyze the results: -``` -python plot.py --definitions t3/faiss_t3/algos.yaml --dataset random-xs -``` -This will place a plot of the algorithms performance, recall/average_precision-vs-throughput, into the *results/* directory. - -### Starting_Your_Development - -First, please create a short name for your team without spaces or special characters. Henceforth in these instructions, this will be referenced as [your_team_name]. - -Create a custom branch off main in this repository: -``` -git checkout -b t3/[your_team_name] -``` -In the *t3/* directory, create a sub-directory using that name. -``` -mkdir t3/[your_team_name] -``` - -### Developing_Your_Dockerfile - -This framework evaluates algorithms in Docker containers by default. Your algorithm's Dockerfile should live in your team's subdirectory at *t3/[your_team_name]*. Ideally, your Docker file should contain everything needed to install and run your algorithm on a system with the same hardware. Given the nature of T3, this will not likely be entirely possible since custom hardware host drivers and certain low level host libraries require an installation step outside of what can be accomplished with Docker alone. Please make your best effort to include as much installation and setup within your Docker container, as we want to promote as much transparency as possible among all participants. 
- -Please consult the Dockerfile [here](faiss_t3/Dockerfile) for an example. - -To build your Docker container, run: -``` -python install.py --dockerfile t3/[your_team_name]/Dockerfile -``` - -### Developing_Your_Algorithm - -Develop and add your algorithm's python class to the [benchmark/algorithms](../benchmark/algorithms) directory. -* You will need to subclass from the [BaseANN class](../benchmark/algorithms/base.py) and implement the functions of that parent class. -* You should consult the examples already in the directory. - -As you develop and test your algorithm, you will likely need to test on smaller datasets. This framework provides a way to create datasets of various sizes. For example, to create a dataset with 10000 20-dimensional random floating point vectors, run: -``` -python create_dataset.py --dataset random-xs -``` -To see a complete list of datasets, run the following: -``` -python create_dataset.py --help -``` -When you are ready to test on the competition datasets, use the create_dataset.py script as follows: -``` -python create_dataset.py --dataset [sift-1B|bigann-1B|text2image-1B|msturing-1B|msspacev-1B|ssnpp-1B] -``` -To benchmark your algorithm, first create an algorithm configuration yaml in your teams directory called *algos.yaml.* This file contains the index build parameters and query parameters that will get passed to your algorithm at run-time. Please look at [this example](faiss_t3/algos.yaml). - -Now you can benchmark your algorithm using the run.py script: -``` -python run.py --t3 --definitions t3/[your_team_name]/algos.yaml --dataset random-xs -``` -This will write the results to the toplevel [results](../results) directory. - -Now you can analyze the results by running: -``` -python plot.py --definitions t3/[your_team_name]/algos.yaml --dataset random-xs -``` -This will place a plot of the algorithms performance, recall/average_precision-vs-throughput, into the toplevel [results](../results) directory. 
- -The plot.py script supports other benchmarks. To see a complete list, run: -``` -python plot.py --help -``` - -### Submitting_Your_Algorithm - -A submission is composed of the following: -* 1 index binary file(s) for each dataset for which you are participating (see *Index File* section below.) -* 1 *algos.yaml* with only one set of build parameters and at most 10 sets of query parameters for each dataset in which you are participating. Please put that file into the *t3/[your_team_name]/* directory. -* Your algorithm's python class ( placed in the [benchmark/algorithms/](../benchmark/algorithms) directory.) -* 1 README file with specific information about your hardware and software (see *README File* section below.) -* Evidence of the cost of your hardware components (see *README File* section below.) -* Optional information (see *Optional Information* section below.) - -### Index File - -The binary index file(s) must be http or azcopy accessible and is referenced within your *t3/[your_team_name]/algos.yaml* config file. Please see the baseline [algos.yaml](faiss_t3/algos.yaml) example. - -### The README File - -Your submission's top-level directory should contain a README.md with the following sections: -* **Hardware Configuration And Cost** This section must contain a table that breaks down the hardware components of your system and the cost. Each entry should link to evidence of the component cost. -* **Hardware Access** This section describes how evaluators acquire access to the hardware (specific instructions or contact information.) -* **No Source Declarations** This section must contain a list of software components that were not provided with the submission. -* **Hardware Setup And Software Installation** This section should contain any hardware and software installation instructions. -* **Run Competition Algorithm** This section should contain instructions to run the competition algorithm, for example, run scripts. 
- -Please consult the baseline [README](faiss_t3/README.md) example. - -### Optional Information - -Please feel free to append sections to the base README requirements. For example, you can include other benchmarks of interest. - -### How_To_Get_Help - -There are several ways to get help as you develop your algorithm using this framework: -* You can submit an issue at this github repository. -* Send an email to the competition's T3 organizer, gwilliams@gsitechnology.com -* Send an email to the competition's googlegroup, big-ann-organizers@googlegroups.com - -### Leaderboard_Ranking - -T3 will maintain four different leaderboards 1) one based on recall/average precision 2) one based on throughput 3) one based on power consumption and 4) one based on cost. The details of the ranking metrics are described here. - -#### Baseline_Performance - -A performance baseline has been established for this competition, based on both queries per second (qps) and recall/average precision (recall measured as recall@10.) For the recall leaderboard, we will rank participants by recall@10/average precision at 2K qps. - -The table below shows the baseline recall@10 for all the (knn search type) datasets at or above 2K qps ( or as close to it as possible. ) - -| dataset | recall@10 | -| ------------ | --------- | -| msturing-1B | 0.909 | -| bigann-1B | 0.927 | -| text2image-1B| 0.860 | -| deep-1B | 0.943 | -| msspacev-1B | 0.909 | - -For the throughput leaderboard, we will rank participants by qps at or above 90% recall@10 (or as close to it as possible.) The table below shows the baseline throughput for all the (knn search type) datasets near 90% recall@10. 
- -| dataset | qps | -| ------------ | -------- | -| msturing-1B | 2359.485 | -| bigann-1B | 3086.656 | -| text2image-1B| 1762.363 | -| deep-1B | 4417.036 | -| msspacev-1B | 2770.848 | - -The following tables show the baseline performance on the range search dataset: - -Instead of recall, the range search dataset utilizes average precision: - -| dataset | ap | -| -----------| -------| -| ssnpp-1B | 0.979 | - -For throughput: - -| dataset | qps | -| -----------| -------- | -| ssnpp-1B | 5572.272 | - -The following table shows the baseline performance on all datasets for power, shown as watt-seconds/query: - -| dataset | wspq | -| ------------ | -------- | -| msturing-1B | 0.204 | -| bigann-1B | 0.167 | -| text2image-1B| 0.123 | -| deep-1B | 0.113 | -| msspacev-1B | 0.167 | -| ssnpp-1B | 0.095 | - -The following table shows the baseline performance on all datasets for cost: - -| dataset | cost | -| ------------ | --------------- | -| msturing-1B | $1,018,332.30 | -| bigann-1B | $785,282.45 | -| text2image-1B| $1,298,436.77 | -| deep-1B | $545,952.10 | -| msspacev-1B | $873,460.84 | -| ssnpp-1B | $429,634.84 | - -Details of how power is measured and how cost is computed are explained further down. - -Baselines were measured on a 56-core Intel Xeon system with 700GB RAM and a V100 Nvidia GPU using the FAISS library with the index strategy called IVF1048576,SQ8. - -Please consult [this document](RANKING.md) for a detailed discussion about how the baseline is used to inform competition thresholds and participant scoring, as well as recent developments on baseline performance. - -#### Recall/Average_Precision_Leaderboard - -This leaderboard leverages the standard recall@10 vs throughput benchmark that has become a standard benchmark when evaluating and comparing approximate nearest neighbor algorithms. We will rank participants based on recall@10/average_precision at 2K qps for each dataset. 
The evaluation framework allows for 10 different search parameter sets and we will use the best value of recall@10 from the set. - -The final ranking will be based on a computed score, which is the sum of the improvements in recall over the baseline for the participating databases. A submission must participate in at least 3 databases. - -Participants that cannot meet or exceed the 2000 qps minimum threshold ( or 1762.363 qps for Text2Image ) for a dataset will be dropped from ranking consideration for that dataset. - -Please consult [this document](RANKING.md) for a detailed discussion about how the baseline is used to inform competition thresholds and participant scoring. - -#### Throughput_Leaderboard - -This leaderboard also leverages the standard recall@10 vs throughput benchmark. We will rank participants based on throughput (qps) at the recall@10 threshold of 90%. The evaluation framework allows for 10 different search parameter sets and we will use the best value of throughput from the set. - -The final ranking will be based on a computed score, which is the sum of the improvements in throughput over the baseline for the participating databases. A submission must participate in at least 3 databases. - -Please consult [this document](RANKING.md) for a detailed discussion about how the baseline is used to inform competition thresholds and participant scoring. - -#### Power_Leaderboard - -This leaderboard is related to power consumption, which is an important consideration when scaling applications and servers in a datacenter. The primary ranking metric is ( kilowatt-hour / query.) Participants must meet or exceed the recall@10 and 2000QPS minimum threshold ( for Text2Image, the baseline performance is the minimum threshold.) The reason for those minimum thresholds is to discourage algorithm’s designers from purposefully sacrificing too much performance in order to lower the power consumption. 
- -The evaluation framework leverages the power sensors available in the standard IPMI power management interface of most commercial server chassis’. We also leverage the open source project ipmicap ( https://github.com/fractalsproject/ipmicap ) to capture the power sensors and calculate the power consumption. - -During evaluation, for each search parameter set, power consumption is acquired over at least 10 seconds running search on the entire query set. During that 10 seconds, multiple consecutive runs on the query set may occur in order to maintain a minimum duration of 10 seconds. Also, the duration may be greater than 10 seconds if a run of 1 query set takes longer than 10 seconds. So a run could be composed of 1 batch query or several and the duration will be at least 10 seconds The power consumption acquired for the run is divided by the total number of queries performed during the run, resulting in ( kilowatt-hour / query ). Up to 10 search parameter sets are allowed, and we use the minimum value for ranking participants, for each dataset. - -The final ranking will be based on a computed score, which is the sum of the improvements in power consumption over the baseline for the participating databases. A submission must participate in at least 3 databases. - -There are no direct thresholds for this benchmark/leaderboard. Indirectly, participants that cannot meet or exceed the recall@10 threshold ( or 0.86 for Text2Image ) for a dataset will be dropped from ranking consideration for that dataset. Scoring will be based on the baseline performance for power consumption, shown here for each dataset: - -Please consult [this document](RANKING.md) for a detailed discussion about how the baseline is used to inform participant scoring for this benchmark. - -#### Cost_Leaderboard - -This leaderboard is related to cost, which is an important consideration when scaling applications and servers in a datacenter. 
The primary ranking metric will be an estimate of capital expense (capex) + operational expense (opex) that is required to scale the participant’s system to 100,000 qps that meets or exceeds the baseline recall@10. - -The formula for the capex estimate is as follows: - -capex = (MSRP of all the hardware components of the system ) X ( minimum number of systems needed to scale to support 100,000 qps ) - -The hardware components include the chassis and all of the electronics within the chassis including the power supplies, motherboard, HDD/SSD, and all extension boards. Participants must provide evidence of MSRP of components ( either published on a web-site or a copy of a invoice/receipt with customer identifiable information removed. ) Volume based pricing is not considered. - -The formula for the opex estimate is as follows: - -opex = ( max qps at or greater than the baseline recall @10 threshold ) X ( kilowatt-hour / query ) X ( seconds / hour ) X ( hours / year) X ( 5 years ) X ( dollars / kilowatt-hour ) X ( minimum number of systems needed to scale to support 100,000 qps ) - -Notes on this formula: -* We will use the maximum qps actually measured that meets or exceeds the baseline recall@10 threshold across all query set parameters. -* We do not account for the cost related to the physical footprint of the system(s) such as the cost of the space occupied by the system(s) in the datacenter. -* We assume linear horizontal scalability of systems with zero cost. In other words, we do not account for the costs associated when actually clustering multiple systems needed to obtain 100,000 qps ( networking equipment, costs due to routing traffic among systems, costs due to merging results, etc. ) -* We will use $0.10 / kilowatt-hour for the power consumption cost. 
-* 5 years is the standard hardware depreciation schedule used for tax purposes with the Internal Revenue Service -* We’d like to thank David Rensin, former Senior Director at Google Cloud, now SVP at Pendo.io for his valuable contribution and consultation with respect to the capex and opex formulas. - -The final ranking will be based on a computed score, which is the sum of the improvements in cost over the baseline for the participating databases. A submission must participate in at least 3 databases. - -There are no direct thresholds for this benchmark/leaderboard. Indirectly, participants that cannot meet or exceed the recall@10 minimum threshold ( or 0.86 for Text2Image ) for a dataset will be dropped from ranking consideration for that dataset. - -## For_Evaluators - -### Evaluating_Participant_Algorithms - -How a participant's algorithm is benchmarked will depend on how they registered for the T3 competition, one of these options: -* Participant sent hardware to competition evaluator at participant's expense. -* Participant is giving the competition valuator remote SSH access to their machine. -* Participant will run the evaluation framework on their own and send the benchmark results to the competition evaluator. - -Evaluation steps for each option is detailed in the next sections. - -### Participant_Sends_Hardware_To_Evaluators - -Evaluators will work with participant's that send hardware during competition on-boarding. Hardware will be sent and returned at the participant's expense. - -Evaluators and participants will work closely to make sure the hardware is properly installed and configured. - -Evaluators may allow remote access to the machines in order to complete the setup, as needed. - -### Participant_Gives_Remote_Access_To_Evaluators - -Participants give competition evaluators access to remote machines via SSH. - -### Participant_Runs_And_Submits_Benchmarks - -This is a very special case, and not all participant's will have this option. 
In this case, the participant will run the evaluation on their own. They will export the data to a CSV via the export.py script and send it to the the competition evaluators. Participants are still required to submit a pull request and upload their best index. - -## Evaluating_Power_Consumption - -The hardware chassis which houses all the hardware must support the IPMI management interface. - -Determine the IP address, port, and authentication credentials of that interface. - -Follow the instructions at IPMICAP open-source project ( http://www.github.com/fractalsproject/ipmicap ) to access the IPMI and configure it to listen to an available port number. - -Capture the machine IP address of the machine which is running IPMICAP ( it does not have to be the same machine as the target hardware. - -Now run the following for each competition dataset: -``` -python run.py --dataset [DATASET] --t3 --definitions [DEFINITION FILE] --sensors [S1 S2 ...] --sessions --powercapture [IPMICAP_MACHINE_IP]:[IPMICAP_LISTEN_PORT]:[TIME_IN_SECONDS] -``` -where S1, S2,... = the sensor records for all POWER_IN sensors ( please see the IPMCAP documentation to determine these sensor records. - -This will monitor power consumption over that period of time ( 10 seconds is a good number ). - -You can retrieve a plot of the power consumptions ( measured as watt-seconds/query ) using the plot.py script. - diff --git a/t3/TASKS_ISSUES_RESOLUTIONS.md b/t3/TASKS_ISSUES_RESOLUTIONS.md deleted file mode 100644 index 37c782b57..000000000 --- a/t3/TASKS_ISSUES_RESOLUTIONS.md +++ /dev/null @@ -1,46 +0,0 @@ - -# BigANN Challenge T3 Tasks, Issues, and Resolutions - -In the spirit of maintaining a fair and open competition, we will be tracking all important remaining tasks and issues, and their respective resolution - and making that all public here on this README. All competition rankings and winners will be "unofficial" until all tasks and issues have been resolved. 
- -Participants should send their questions and issues to the T3 organizer directly (gwilliams@gsitechnology.com), or to the competition google group at big-ann-organizers@googlegroups.com. Note that some issues may require a complete re-evaluation of an algorithm on its respective hardware, or may require additional information from a participant or competition organizer(s). - -## Tasks (open) - -* [T3 Organizer self-report] In the private set evaluation, there are issues with the msspace-v ground truth file preventing any submission evaluation and scoring on that dataset. -* [T3 Organizer self-report] In the private set evaluation, there are issues with some submissions crashing on either/both deep-1B and msspacev-1b thus preventing any scoring on that dataset. -* [Microsoft to T3 Organizer] Currently, DiskANN cannot qualify for power and cost benchmarks due to issue with running IPMICAP ( python ipmi in particular seems to be the issue. ) - * PENDING RESOLUTION: [T3 Organizer to Microsoft] We will work on local dcmi support in the IPMICAP server. -* [T3 Organizer to Microsoft] Need to retrieve "results" h5py files from MS DiskANN remote machine. - -## Issues (open) - -* [T3 Organizer self-report] The "opex" power cost for an Nvidia submission seems impossibly low ($80). - * PENDING RESOLUTION: We need to measure quiescent power of a system and establish the min power consumption and troubleshoot the DCMI power reporting on the NVidia system. - -## Resolutions - -* [GSI asked] What does NQ mean? - * [T3 Organizer responded] It could mean 1) team did not submit a qualifying algorithm for the benchmark 2) team decided did not participate in that benchmark 3) unable to get some key data for the benchmark (such as power or system cost, or both ). -* [T3 Organizer self-report] Need to retrieve "results" h5py files from NVidia's remote machine. 
- * Done on 11/23/2021 -* [T3 Organizer to NVidia] Need to retrieve power monitoring "results" h5py files from NVidia's remote machine. - * Done on 11/23/2021 and subsequently on changes to algos.yaml -* [GSI to T3 Organizer] Need better documentation for how to extract power benchmark from plot.py script. - * Answered via email. Basically, you need to supply "wspq" as an explicit metric you want to retrieve using the chosen axis. Run "python ploy.py --help" to get more information. -* [GSI to T3 Organizers] We cannot reproduce the baseline performance on SSNPP on same/similar hardware. - * Organizer repeated the eval and it was the same. It could have been an issue with faiss (gpu) library and version. -* [GSI to T3 Organizers] Have you discussed taking power also on the recall working point and not just on the throughput working point? -[GSI asks T3 Organizers] Since some algorithms implement smart caching mechanisms to simulate real life scenarios and since the competition framework sends the same queries again and again 50 time for each dataset (5 runs x 10 query configurations) which is not a real life case. It is important that competition framework needs to verify the results, automatically (and if not possible manually) that no caching mechanism is used in between runs and in between query configurations. One way is to make sure that the throughput for the runs doesn’t differ much taking into account that there are 5 runs and 10 configurations with the same queries. Probably a better way is to send for different queries or somehow cool down the cache in between runs by sending random queries. - * The eval framework now implements "possible query response cache" detection and the competition reports this as an anomaly and allows teams to explain why these happen. It's too late in the competition to establish a policy to deal with these "anomalies" such as 1) ask team to mitigate the effect 2) cool the cache with random queries 3) throw out the data. 
-* [T3 Organizer to Microsoft] Currently reported DiskANN CSV results is using an old version of recall computation (ie, not accounting for ties and it will likely affect msspacev-1B recall mostly). - * This was resolved. Microsoft exported a new csv with the proper recall. -* [GSI to T3 Organizer] New index for SSNPP and Text2Image requires re-evaluation for those datasets and updated scores. - * This was done successfully on the public query set. -* [Intel asks T3 Organizer] Why won't there be one winner for T3 that combines all individual benchmarks? - * We have provided the reason to Intel. We weren't sure how to combine them in this first competition - likely it will be combined in the future. -* [Intel asks T3 Organizer] Why are power and cost rankings optional for a submission? - * We have provided the reason to Intel. We werent sure how easy it would be to support this for all participants in this first competition. -* [T3 Organizer asks NVidia] Can't we use an MSRP from another company as proxy for system cost? - * We will take the cheapest MSRP from third party seller for the leaderboard (we found 150K). We've footnoted this in the rankings. 
- diff --git a/t3/eval_2021/faiss_t3/prun.sh b/t3/eval_2021/faiss_t3/prun.sh deleted file mode 100755 index a34886dca..000000000 --- a/t3/eval_2021/faiss_t3/prun.sh +++ /dev/null @@ -1,15 +0,0 @@ -#!/bin/bash - -#python run.py --t3 --private-query --definitions t3/faiss_t3/algos.yaml --dataset deep-1B --nodocker -python run.py --t3 --private-query --definitions t3/faiss_t3/algos.yaml --dataset bigann-1B --nodocker -#python run.py --t3 --private-query --definitions t3/faiss_t3/algos.yaml --dataset text2image-1B --nodocker -#python run.py --t3 --private-query --definitions t3/faiss_t3/algos.yaml --dataset msturing-1B --nodocker -#python run.py --t3 --private-query --definitions t3/faiss_t3/algos.yaml --dataset msspacev-1B --nodocker -#python run.py --t3 --private-query --definitions t3/faiss_t3/algos.yaml --dataset ssnpp-1B --nodocker - -#python run.py --definitions t3/faiss_t3/algos.yaml --dataset deep-1B --t3 --private-query --nodocker --power-capture 192.168.99.110:1237:10 -#python run.py --definitions t3/faiss_t3/algos.yaml --dataset bigann-1B --t3 --private-query --nodocker --power-capture 192.168.99.110:1237:10 -#python run.py --definitions t3/faiss_t3/algos.yaml --dataset text2image-1B --t3 --private-query --nodocker --power-capture 192.168.99.110:1237:10 -#python run.py --definitions t3/faiss_t3/algos.yaml --dataset msturing-1B --t3 --private-query --nodocker --power-capture 192.168.99.110:1237:10 -#python run.py --definitions t3/faiss_t3/algos.yaml --dataset msspacev-1B --t3 --private-query --nodocker --power-capture 192.168.99.110:1237:10 -#python run.py --definitions t3/faiss_t3/algos.yaml --dataset ssnpp-1B --t3 --private-query --nodocker --power-capture 192.168.99.110:1237:10 diff --git a/t3/faiss_t3/Dockerfile b/t3/faiss_t3/Dockerfile deleted file mode 100644 index 5720572f6..000000000 --- a/t3/faiss_t3/Dockerfile +++ /dev/null @@ -1,35 +0,0 @@ - -FROM nvidia/cuda:11.0-devel-ubuntu18.04 - -ENV PATH="/root/miniconda3/bin:${PATH}" -ARG 
PATH="/root/miniconda3/bin:${PATH}" - -# CONDA - -RUN apt-get update && apt-get install -y wget build-essential git - -RUN wget \ - https://repo.anaconda.com/miniconda/Miniconda3-latest-Linux-x86_64.sh \ - && mkdir /root/.conda \ - && bash Miniconda3-latest-Linux-x86_64.sh -b \ - && rm -f Miniconda3-latest-Linux-x86_64.sh \ - && conda --version \ - && conda install -c pytorch python=3.6.9 faiss-gpu cudatoolkit=11.0 - -RUN conda --version && which conda && which python && which pip3 - -# BIGANN - -RUN pip3 install -U pip - -WORKDIR /home/app -COPY t3/faiss_t3/faiss-gpu_requirements.txt run_algorithm.py ./ -RUN pip3 install -r faiss-gpu_requirements.txt - -ENTRYPOINT ["python3", "run_algorithm.py"] - -## For the following RUN command to work, we need to initiate docker build -## with a gpu device request much like what's done with docker eval run. -# RUN python3 -c 'import faiss; print("gpus=", faiss.get_num_gpus())' - -RUN python3 -c 'import faiss; print(faiss.IndexFlatL2)' diff --git a/t3/faiss_t3/README.md b/t3/faiss_t3/README.md deleted file mode 100644 index d7dadadeb..000000000 --- a/t3/faiss_t3/README.md +++ /dev/null @@ -1,66 +0,0 @@ -# FAISS Baseline - -This README contains information required for T3 Track submissions. - -## Hardware Configuration And Cost - -|Part |Model |No. |Unit Price |Total Price| -|-----------------------------|--------------------------------------------------|----|------------------------------------|-----------| -|Chassis and Motherboard |[Advantech Sky-6200 2U](cost/AdvantechSky6200.pdf)| 1|[5572.42](cost/AdvantechSky6200.pdf)| 5572.42| -|RAM |[Advantech 32GB Memory](cost/RAM.pdf) | 24| [259.00](cost/RAM.pdf)| 6216.00| -|SSD |[2TB SeaGate](cost/SSD.pdf) | 1| [334.48](cost/SSD.pdf)| 334.48| -|GPU |[NVidia V100](cost/GPU.pdf) | 1| [9899.00](cost/GPU.pdf)| 9899.00| -|Total | | 1| | 22021.90| - -## Hardware Access - -This hardware is maintained by the competition organizers. 
Please send an email to big-ann-organizers@googlegroups.com to get access to a system or see the section below to build your own system. - -## No Source Code Declarations - -This submission requires the following software components where source-code is not available and/or not part of the source-code for this submission: -* NVidia docker container runtime ( https://docs.nvidia.com/datacenter/cloud-native/container-toolkit/install-guide.html ) -* CUDA 11 libraries and host drivers -* NVidia V100 firmware - -## Hardware Setup And Software Installation - -## Prerequisites - -* Linux Ubuntu 18.04 -* CUDA 11.0 -* The NVidia docker container runtime ( https://docs.nvidia.com/datacenter/cloud-native/container-toolkit/install-guide.html ) -* This cloned project repository - -### Test On A Small Dataset - -Note that all the subsequent commands must be run in the top-level directory of this repo on your machine. - -First build the faiss_t3 docker container: -``` -python install.py --dockerfile t3/faiss_t3/Dockerfile -``` -Now create a small random dataset, query set, and associated ground truth: -``` -python create_dataset.py --dataset random-xs -``` -Now build a FAISS index for this dataset: -``` -python run.py --definitions t3/faiss_t3/algos.yaml --dataset random-xs --t3 -``` -This may take an hour or so. When it's done, you can plot the recall-vs-throughput results as follows: -``` -python plot.py --definitions t3/faiss_t3/algos.yaml --dataset random-xs -``` -You can now run on the competition datasets. - -#### Known Issues - -The NVidia GPU docker support for various Linux distributions involves a lot of steps. - -The run.py script also supports a "--nodocker" flag. When run in this way, the algorithm is not launched in a docker container. Obviously, this requires having CUDA 11.0 drivers working natively on your system, and the installation of the compatible FAISS GPU library. 
- -If you take this route, we recommend using the Anaconda distribution of python, creating a python=3.8.5 environment, and installing FAISS using this command: -``` -conda install -c pytorch faiss-gpu cudatoolkit=11.0 -``` diff --git a/t3/faiss_t3/algos.yaml b/t3/faiss_t3/algos.yaml deleted file mode 100644 index 4919134e6..000000000 --- a/t3/faiss_t3/algos.yaml +++ /dev/null @@ -1,231 +0,0 @@ -random-xs: - faiss-t3: - docker-tag: billion-scale-benchmark-faiss_t3 - module: benchmark.algorithms.faiss_t3 - constructor: FaissT3 - base-args: ["@metric"] - run-groups: - base: - # the following args show all build arguments that can be provided to the t3 baseline. - args: | - [{"indexkey": "IVF5,SQ8", - "buildthreads": -1, - "by_residual": -1, - "add_bs": 100000, - "maxtrain": 0, - "clustering_niter": -1, - "add_splits": 1, - "no_precomputed_tables": true, - "searchthreads": -1, - "parallel_mode": 3, - "search_bs": 8192 - }] - query-args: | - ["nprobe=1", - "nprobe=2", - "nprobe=4", - "nprobe=8", - "nprobe=16", - "nprobe=32", - "nprobe=64", - "nprobe=128", - "nprobe=256"] -deep-1B: - faiss-t3: - docker-tag: billion-scale-benchmark-faiss_t3 - module: benchmark.algorithms.faiss_t3 - constructor: FaissT3 - base-args: ["@metric"] - run-groups: - base: - args: | - [{"indexkey": "IVF1048576,SQ8", - "url":"https://storage.googleapis.com/bigann/indexes/faiss/1.7.1/deep-1B.IVF1048576%2CSQ8.faissindex"}] - query-args: | - ["nprobe=90", - "nprobe=100", - "nprobe=110", - "nprobe=120", - "nprobe=128", - "nprobe=140", - "nprobe=160", - "nprobe=180", - "nprobe=200", - "nprobe=220"] -bigann-1B: - faiss-t3: - docker-tag: billion-scale-benchmark-faiss_t3 - module: benchmark.algorithms.faiss_t3 - constructor: FaissT3 - base-args: ["@metric"] - run-groups: - base: - args: | - [{"indexkey": "IVF1048576,SQ8", - "url":"https://storage.googleapis.com/bigann/indexes/faiss/1.7.1/bigann-1B.IVF1048576%2CSQ8.faissindex"}] - query-args: | - ["nprobe=90", - "nprobe=100", - "nprobe=110", - 
"nprobe=120", - "nprobe=128", - "nprobe=140", - "nprobe=160", - "nprobe=180", - "nprobe=200", - "nprobe=220"] -msspacev-1B: - faiss-t3: - docker-tag: billion-scale-benchmark-faiss_t3 - module: benchmark.algorithms.faiss_t3 - constructor: FaissT3 - base-args: ["@metric"] - run-groups: - base: - args: | - [{"indexkey": "IVF1048576,SQ8", - "url":"https://storage.googleapis.com/bigann/indexes/faiss/1.7.1/msspacev-1B.IVF1048576%2CSQ8.faissindex"}] - query-args: | - ["nprobe=1", - "nprobe=2", - "nprobe=4", - "nprobe=8", - "nprobe=16", - "nprobe=32", - "nprobe=64", - "nprobe=128", - "nprobe=256"] -text2image-1B: - faiss-t3: - docker-tag: billion-scale-benchmark-faiss_t3 - module: benchmark.algorithms.faiss_t3 - constructor: FaissT3 - base-args: ["@metric"] - run-groups: - base: - args: | - [{"indexkey": "IVF1048576,SQ8", - "url":"https://storage.googleapis.com/bigann/indexes/faiss/1.7.1/text2image-1B.IVF1048576%2CSQ8.faissindex"}] - query-args: | - ["nprobe=90", - "nprobe=100", - "nprobe=110", - "nprobe=120", - "nprobe=128", - "nprobe=140", - "nprobe=160", - "nprobe=180", - "nprobe=200", - "nprobe=220"] -msturing-10M: - faiss-t3: - docker-tag: billion-scale-benchmark-faiss_t3 - module: benchmark.algorithms.faiss_t3 - constructor: FaissT3 - base-args: ["@metric"] - run-groups: - base: - args: | - [{"indexkey": "IVF1048576,SQ8", - "url":"https://storage.googleapis.com/bigann/indexes/faiss/1.7.1/msturing-10M.IVF1048576%2CSQ8.faissindex"}] - query-args: | - ["nprobe=1", - "nprobe=2", - "nprobe=4", - "nprobe=8", - "nprobe=16", - "nprobe=32", - "nprobe=64", - "nprobe=128", - "nprobe=256"] -msturing-1B: - faiss-t3: - docker-tag: billion-scale-benchmark-faiss_t3 - module: benchmark.algorithms.faiss_t3 - constructor: FaissT3 - base-args: ["@metric"] - run-groups: - base: - args: | - [{"indexkey": "IVF1048576,SQ8", - "url":"https://storage.googleapis.com/bigann/indexes/faiss/1.7.1/msturing-1B.IVF1048576%2CSQ8.faissindex"}] - query-args: | - ["nprobe=28", - "nprobe=32", - 
"nprobe=37", - "nprobe=42", - "nprobe=47", - "nprobe=52", - "nprobe=57", - "nprobe=62", - "nprobe=64", - "nprobe=70"] -ssnpp-1M: - faiss-t3: - docker-tag: billion-scale-benchmark-faiss_t3 - module: benchmark.algorithms.faiss_t3 - constructor: FaissT3 - base-args: ["@metric"] - run-groups: - base: - args: | - [{"indexkey": "OPQ32_128,IVF100_HNSW32,PQ32", - "url":"https://storage.googleapis.com/bigann/indexes/faiss/1.7.1/ssnpp-1M.IVF1048576%2CSQ8.faissindex", - "parallel_mode": 2, - "add_splits": 0}] - query-args: | - ["nprobe=1", - "nprobe=2", - "nprobe=4", - "nprobe=8", - "nprobe=16", - "nprobe=32", - "nprobe=64", - "nprobe=128", - "nprobe=256"] -ssnpp-10M: - faiss-t3: - docker-tag: billion-scale-benchmark-faiss_t3 - module: benchmark.algorithms.faiss_t3 - constructor: FaissT3 - base-args: ["@metric"] - run-groups: - base: - args: | - [{"indexkey": "OPQ32_128,IVF1048576_HNSW32,PQ32", - "url":"https://storage.googleapis.com/bigann/indexes/faiss/1.7.1/ssnpp-10M.OPQ32_128%2CIVF1048576_HNSW32%2CPQ32.faissindex", - "parallel_mode": 2, - "add_splits": 0}] - query-args: | - ["nprobe=1", - "nprobe=2", - "nprobe=4", - "nprobe=8", - "nprobe=16", - "nprobe=32", - "nprobe=64", - "nprobe=128", - "nprobe=256"] -ssnpp-1B: - faiss-t3: - docker-tag: billion-scale-benchmark-faiss_t3 - module: benchmark.algorithms.faiss_t3 - constructor: FaissT3 - base-args: ["@metric"] - run-groups: - base: - args: | - [{"indexkey": "IVF1048576,SQ8", - "url":"https://storage.googleapis.com/bigann/indexes/faiss/1.7.1/ssnpp-1B.IVF1048576%2CSQ8.faissindex", - "parallel_mode": 2, - "add_splits": 0}] - query-args: | - ["nprobe=1", - "nprobe=2", - "nprobe=4", - "nprobe=8", - "nprobe=16", - "nprobe=32", - "nprobe=64", - "nprobe=128", - "nprobe=256"] diff --git a/t3/faiss_t3/baseline_plots/bigann-1B-r-vs-p.png b/t3/faiss_t3/baseline_plots/bigann-1B-r-vs-p.png deleted file mode 100755 index fcbbe1470..000000000 Binary files a/t3/faiss_t3/baseline_plots/bigann-1B-r-vs-p.png and /dev/null differ diff --git 
a/t3/faiss_t3/baseline_plots/bigann-1B-r-vs-t.png b/t3/faiss_t3/baseline_plots/bigann-1B-r-vs-t.png deleted file mode 100755 index b0dac5d7f..000000000 Binary files a/t3/faiss_t3/baseline_plots/bigann-1B-r-vs-t.png and /dev/null differ diff --git a/t3/faiss_t3/baseline_plots/deep-1B-r-vs-p.png b/t3/faiss_t3/baseline_plots/deep-1B-r-vs-p.png deleted file mode 100755 index ea9594c98..000000000 Binary files a/t3/faiss_t3/baseline_plots/deep-1B-r-vs-p.png and /dev/null differ diff --git a/t3/faiss_t3/baseline_plots/deep-1B-r-vs-t.png b/t3/faiss_t3/baseline_plots/deep-1B-r-vs-t.png deleted file mode 100755 index f5d7e0265..000000000 Binary files a/t3/faiss_t3/baseline_plots/deep-1B-r-vs-t.png and /dev/null differ diff --git a/t3/faiss_t3/baseline_plots/msspacev-1B-r-vs-p.png b/t3/faiss_t3/baseline_plots/msspacev-1B-r-vs-p.png deleted file mode 100755 index dc25cc1b9..000000000 Binary files a/t3/faiss_t3/baseline_plots/msspacev-1B-r-vs-p.png and /dev/null differ diff --git a/t3/faiss_t3/baseline_plots/msspacev-1B-r-vs-t.png b/t3/faiss_t3/baseline_plots/msspacev-1B-r-vs-t.png deleted file mode 100755 index 6c69b3b2d..000000000 Binary files a/t3/faiss_t3/baseline_plots/msspacev-1B-r-vs-t.png and /dev/null differ diff --git a/t3/faiss_t3/baseline_plots/msturing-1B-r-vs-p.png b/t3/faiss_t3/baseline_plots/msturing-1B-r-vs-p.png deleted file mode 100755 index 80912d64e..000000000 Binary files a/t3/faiss_t3/baseline_plots/msturing-1B-r-vs-p.png and /dev/null differ diff --git a/t3/faiss_t3/baseline_plots/msturing-1B-r-vs-t.png b/t3/faiss_t3/baseline_plots/msturing-1B-r-vs-t.png deleted file mode 100755 index df8df2b09..000000000 Binary files a/t3/faiss_t3/baseline_plots/msturing-1B-r-vs-t.png and /dev/null differ diff --git a/t3/faiss_t3/baseline_plots/text2image-1B-r-vs-p.png b/t3/faiss_t3/baseline_plots/text2image-1B-r-vs-p.png deleted file mode 100644 index bc0aa5afe..000000000 Binary files a/t3/faiss_t3/baseline_plots/text2image-1B-r-vs-p.png and /dev/null differ diff --git 
a/t3/faiss_t3/baseline_plots/text2image-1B-r-vs-t.png b/t3/faiss_t3/baseline_plots/text2image-1B-r-vs-t.png deleted file mode 100644 index e0be37dbf..000000000 Binary files a/t3/faiss_t3/baseline_plots/text2image-1B-r-vs-t.png and /dev/null differ diff --git a/t3/faiss_t3/cost/AdvantechSky6200.pdf b/t3/faiss_t3/cost/AdvantechSky6200.pdf deleted file mode 100644 index c0012482d..000000000 Binary files a/t3/faiss_t3/cost/AdvantechSky6200.pdf and /dev/null differ diff --git a/t3/faiss_t3/cost/GPU.pdf b/t3/faiss_t3/cost/GPU.pdf deleted file mode 100644 index 01871eb40..000000000 Binary files a/t3/faiss_t3/cost/GPU.pdf and /dev/null differ diff --git a/t3/faiss_t3/cost/RAM.pdf b/t3/faiss_t3/cost/RAM.pdf deleted file mode 100644 index a65b66027..000000000 Binary files a/t3/faiss_t3/cost/RAM.pdf and /dev/null differ diff --git a/t3/faiss_t3/cost/SSD.pdf b/t3/faiss_t3/cost/SSD.pdf deleted file mode 100644 index 2010b2910..000000000 Binary files a/t3/faiss_t3/cost/SSD.pdf and /dev/null differ diff --git a/t3/faiss_t3/faiss-gpu_requirements.txt b/t3/faiss_t3/faiss-gpu_requirements.txt deleted file mode 100644 index 5fe6dabde..000000000 --- a/t3/faiss_t3/faiss-gpu_requirements.txt +++ /dev/null @@ -1,11 +0,0 @@ -ansicolors==1.1.8 -docker==2.6.1 -h5py==2.10.0 -matplotlib -numpy -pyyaml==5.1 -psutil==5.6.6 -scipy -scikit-learn -jinja2==2.10.1 -pandas diff --git a/t3/gemini/.gitignore b/t3/gemini/.gitignore deleted file mode 100644 index 031f4fc40..000000000 --- a/t3/gemini/.gitignore +++ /dev/null @@ -1,3 +0,0 @@ -1b -centroids_2m -records_weights diff --git a/t3/gemini/README.md b/t3/gemini/README.md deleted file mode 100644 index 19e929900..000000000 --- a/t3/gemini/README.md +++ /dev/null @@ -1,65 +0,0 @@ -# Gemini - -This README contains information required for T3 Track submissions. - -## Hardware Configuration And Cost - -|Part |Model |No. 
|Unit Price |Total Price| -|-----------------------------|--------------------------------------------------|----|------------------------------------|-----------| -|Chassis and Motherboard |[Advantech Sky-6200 2U](cost/AdvantechSky6200.pdf)| 1|[5572.42](cost/AdvantechSky6200.pdf)| 5572.42| -|RAM |[Advantech 64GB Memory](cost/RAM.pdf) | 24| [409.99](cost/RAM.pdf)| 9839.76| -|SSD |[2TB SeaGate](cost/SSD.pdf) | 1| [334.48](cost/SSD.pdf)| 334.48| -|APU |[LedaE APU](cost/APU.pdf) | 4| [35000.00](cost/APU.pdf)| 140000.00| -|GPU |[NVidia V100](cost/GPU.pdf) | 1| [9899.00](cost/GPU.pdf)| 9899.00| -|Total | | 1| | 165645.66| - -## Hardware Access - -This hardware is maintained by the GSI Technology, one of the competition organizers. Please send an email to big-ann-organizers@googlegroups.com or gwilliams@gsitechnology.com to get access to a system or see the section below to build your own system. - -## No Source Code Declarations - -This submission requires the following software components where source-code is not available and/or not part of the source-code for this submission: -* NVidia docker container runtime ( https://docs.nvidia.com/datacenter/cloud-native/container-toolkit/install-guide.html ) -* CUDA 11 libraries and host drivers -* NVidia V100 firmware compatible with CUDA 11 -* Gemini Software system software and host drivers (version TBD) -* Gemini pyGSL vector search library (version TBD) -* LedaE PCIe board firmware (version TBD) - -## Hardware Setup And Software Installation - -### Prerequisites - -* Linux Ubuntu 18.04 -* Python 3.69 -* Python package requirements in [requirements.txt](requirements.txt) -* CUDA 11.0 -* The NVidia docker container runtime ( https://docs.nvidia.com/datacenter/cloud-native/container-toolkit/install-guide.html ) -* Gemini system software and host drivers ( please follow the instructions that came with your Leda hardware.) 
-* This cloned project repository - -### Test Your Leda Hardware - -At the command line run the following diagnostic program to make sure your boards are operational: - -```dev_diagnostic --iter 1 --run-all-cards 1``` - -### pyGSL Libraries - -Download the pyGSL libraries from [here](https://storage.googleapis.com/bigann/gemini/gsl_resources.tar.gz.1) and unpack into the toplevel directory of the cloned repository. - -### Competition Index Files - -Currently the competition index files must be downloaded and installed manually. - -Download all the index files from [here](tbd) (TBD) and unpack into the cloned repo's data directory. - -## Run The Competition Algorithm - -In the top-level directory of the cloned repository, run the following command: - -```t3/gemini/run_bin_python.sh``` - -Note that it will take a few minutes for all the index files to load, so be patient. - diff --git a/t3/gemini/algos.yaml b/t3/gemini/algos.yaml deleted file mode 100644 index e590bf96f..000000000 --- a/t3/gemini/algos.yaml +++ /dev/null @@ -1,25 +0,0 @@ -deep-1B: - gemini-t3: - docker-tag: billion-scale-benchmark-faissconda - module: benchmark.algorithms.gemini - constructor: GeminiT3 - base-args: ["@metric"] - run-groups: - base: - args: | - [ - "{'nbits': 512, 'qbits':768, 'nlist':2097152, 'nt':83886080, 'num_apuc':3, 'f16':True }" - ] - query-args: | - [ - "{'nprobe': 800, 'nprobe_refine': 480, 'hamming_k': 5000, 'average_clstr_size_factor': 0.0}", - "{'nprobe': 800, 'nprobe_refine': 480, 'hamming_k': 2000, 'average_clstr_size_factor': 0.0}", - "{'nprobe': 800, 'nprobe_refine': 480, 'hamming_k': 1000, 'average_clstr_size_factor': 0.0}", - "{'nprobe': 800, 'nprobe_refine': 480, 'hamming_k': 500, 'average_clstr_size_factor': 0.0}", - "{'nprobe': 800, 'nprobe_refine': 480, 'hamming_k': 250, 'average_clstr_size_factor': 0.0}", - "{'nprobe': 800, 'nprobe_refine': 400, 'hamming_k': 1000, 'average_clstr_size_factor': 0.0}", - "{'nprobe': 800, 'nprobe_refine': 300, 'hamming_k': 1000, 
'average_clstr_size_factor': 0.0}", - "{'nprobe': 700, 'nprobe_refine': 380, 'hamming_k': 1000, 'average_clstr_size_factor': 0.0}", - "{'nprobe': 600, 'nprobe_refine': 280, 'hamming_k': 1000, 'average_clstr_size_factor': 0.0}", - "{'nprobe': 500, 'nprobe_refine': 180, 'hamming_k': 1000, 'average_clstr_size_factor': 0.0}" - ] diff --git a/t3/gemini/buildidx/build_index.py b/t3/gemini/buildidx/build_index.py deleted file mode 100644 index 38c2fe16c..000000000 --- a/t3/gemini/buildidx/build_index.py +++ /dev/null @@ -1,167 +0,0 @@ -import os -import numpy as np -import h5py -import faiss -import sys - -# -# Get parameters -# -dbase = "deep-1B" -nlist = 2097152 -qbits = 768 -nbits = 512 -nt = 83886080 -is_f16 = True -num_records = 1000000000 -output_dir = "/mnt/localdisk2/George/Projects/BigANN/gemini/indexes" - -# -# Form the path to the source files -# -resources_path = '../../t3/gsi/' -case_dir = '1b/' -resources_path_case = f'{resources_path}{case_dir}' -centroids_dirs = { 524288: 'centroids_512k/', 2097152: 'centroids_2m/', 4194304: 'centroids_4m/'} -num_centroids_dir = centroids_dirs[nlist] -fp_quantizer_file_name = f'{resources_path}{num_centroids_dir}Deep1B.nt{nt}.nlist{nlist}.quantizer' -records_encoding_file_name = f'{resources_path}records_weights/records_weights.bits{nbits}.npy' -centroids_encoding_file_name = f'{resources_path}{num_centroids_dir}centroids_weights.nt{nt}.nlist{nlist}.nbits{nbits}.npy' -index_file_name = f'{resources_path_case}Deep1B.ivfbinnh.nt{nt}.nlist{nlist}.nb{num_records}.bits{qbits}.index' -db_path = f'{resources_path_case}fdb.npy' - -# -# Validate all the source files exists -# -print('********************** Paths ***************************') -print('fp_quantizer_file_name =', fp_quantizer_file_name) -if not os.path.isfile(fp_quantizer_file_name): - raise FileNotFoundError(fp_quantizer_file_name) -print('records_encoding_file_name =', records_encoding_file_name) -if not os.path.isfile(records_encoding_file_name): - raise 
FileNotFoundError(records_encoding_file_name) -print('centroids_encoding_file_name =', centroids_encoding_file_name) -if not os.path.isfile(centroids_encoding_file_name): - raise FileNotFoundError(centroids_encoding_file_name) -print('index_file_name =', index_file_name) -if not os.path.isfile(index_file_name): - raise FileNotFoundError(index_file_name) -print('db_path =', db_path) -if not os.path.isfile(db_path): - raise FileNotFoundError(db_path) -print('********************************************************') - -# -# Form the path to the output index file -# -output_file = "%s.nbits=%d,qbits=%d,nlist=%d,nt=%d,nb=%d,fp16=%s.geminiindex" % ( dbase, nbits, qbits, nlist, nt, num_records, str(is_f16)) -full_path = os.path.join( output_dir, output_file ) -print("Checking if index file already exists (%s)" % full_path) -if os.path.exists(full_path): - raise Exception("gemini index file already exists (%s)" % full_path ) - -# -# Load the source files -# -def convert_index_to_cluster_and_ids_lists(index, nbits): - cluster_list = np.empty(index.invlists.nlist, dtype=object) - ids_list = np.empty(index.invlists.nlist, dtype=object) - - zero_count = 0 - - for i in range(index.invlists.nlist): - list_sz = index.invlists.list_size(i) - - if list_sz == 0: - zero_count = zero_count + 1 - ids = None - else: - ids_ptr = index.invlists.get_ids(i) - ids = np.array(faiss.rev_swig_ptr(ids_ptr, list_sz)).reshape(-1, 1).astype(np.uint32) # GSL requires a 2d arrray for some reason - index.invlists.release_ids(ids_ptr) - # index.invlists.release_ids(list_sz, ids_ptr) - ids_list[i] = ids - - codes_ptr = index.invlists.get_codes(i) - codes = np.array(faiss.rev_swig_ptr(codes_ptr, list_sz * nbits // 8)).reshape(list_sz, nbits//8) - index.invlists.release_codes(codes_ptr) - # index.invlists.release_codes(list_sz * nbits // 8, codes_ptr) - cluster_list[i] = codes - - print('zero_count =', zero_count) - return cluster_list, ids_list - -def get_cluster_and_ids_lists(index, nbits): - 
print('Creating cluster + ids lists...') - ret = convert_index_to_cluster_and_ids_lists(index, nbits) - return ret - -print("Reading binary index %s" % index_file_name) -index = faiss.read_index_binary(index_file_name) - -print("Extracting binary cluster list and ids") -# cluster_list, ids_list = get_cluster_and_ids_lists(self.index, nbits) -cluster_list, ids_list = get_cluster_and_ids_lists(index, qbits) -print(type(cluster_list), type(ids_list), cluster_list[0].shape, cluster_list[0].dtype, cluster_list[1].shape, ids_list[0].shape, ids_list[0].dtype) - -print("Extracting binary quantizer and centroids") -quantizer = faiss.downcast_IndexBinary(index.quantizer) -centroids = faiss.vector_to_array(quantizer.xb) -centroids = np.reshape(centroids, (quantizer.ntotal, quantizer.d//8)) -print('Got centroids (binary):', centroids.shape, centroids.dtype) - -print("Extracting float quantizer and centroids") -l2_quantizer = faiss.read_index(fp_quantizer_file_name) -l2_centroids = faiss.vector_float_to_array(l2_quantizer.xb) -l2_centroids = np.reshape(l2_centroids, (nlist, l2_quantizer.d)) -print('Got centroids (float):', l2_centroids.shape, l2_centroids.dtype) - -print("Reading centroids encoding file") -centroids_encoding_np = np.load(centroids_encoding_file_name) - -print("Reading records encoding file") -records_encoding_np = np.load(records_encoding_file_name) - -# -# Create the monolithic index and save -# -def add_ndarray_with_type_object( h5f, name, arr ): - print("arrs", arr[0].shape, arr[0].dtype, arr[1].shape, arr[0].dtype) - dt = h5py.vlen_dtype(arr[0].dtype) - dset = h5f.create_dataset(name, arr.shape, dtype=dt) - print("dt", dt, dset) - for i in range( arr.shape[0] ): - item = arr[i] - #print("item",i, type(item)), - if item!=None: dset[i] = item.reshape(-1) - else: dset[i] = item - -print("Creating (h5py) index file at %s" % full_path) -h5f = h5py.File(full_path, 'w') - -print("Adding cluster_list") -#h5f.create_dataset('cluster_list', data=cluster_list) 
-add_ndarray_with_type_object( h5f, "cluster_list", cluster_list ) - -print("Adding ids_list") -#h5f.create_dataset('ids_list', data=ids_list) -add_ndarray_with_type_object( h5f, "ids_list", ids_list ) - -print("Adding binary centroids") -h5f.create_dataset('centroids', data=centroids) - -print("Adding float centroids") -h5f.create_dataset('l2_centroids', data=l2_centroids) - -print("Adding centroids_encoding") -h5f.create_dataset('centroids_encoding_np', data=centroids_encoding_np) - -print("Adding records_encoding") -h5f.create_dataset('records_encoding_np', data=records_encoding_np) - -print("Adding dataset") -h5f.create_dataset(' -print("Finalizing and closing index.") -h5f.close() - -printf("Done. Wrote index at %s" % full_path ) diff --git a/t3/gemini/buildidx/htest.py b/t3/gemini/buildidx/htest.py deleted file mode 100644 index 8d6888229..000000000 --- a/t3/gemini/buildidx/htest.py +++ /dev/null @@ -1,101 +0,0 @@ -import h5py -import numpy as np -import sys - -if True: - arr = np.empty( (2,), dtype=object) - a = np.random.rand( 3,4 ) - b = np.random.rand( 2,4 ) - arr[0] = a - arr[1] = b - print("arr", arr) - - f = h5py.File('/tmp/foo.hdf5','w') - dt = h5py.vlen_dtype(a.dtype) - dset = f.create_dataset('vlen_int', arr.shape, dtype=dt) - - a = a.reshape( -1 ) - dset[0] = a - - b = b.reshape( -1 ) - dset[1] = b - - farr = dset[0:] - print(farr.shape, farr.dtype) - - narr = np.empty( (2, ), dtype=object) - for i in range(2): - narr[i] = dset[i].reshape( -1, 4 ) - - print("narr", narr) - sys.exit(0) - -if True: - f = h5py.File('/tmp/foo.hdf5','w') - dt = h5py.vlen_dtype(np.dtype('int32')) - dset = f.create_dataset('vlen_int', (2,), dtype=dt) - dset[0] = [1,2,3,4] - dset[1] = [1,2,3,4,5] - print(type(dset[0]),dset[0].dtype,dset[0].shape) - arr = dset[0] - a = arr.reshape( (2,2) ) - print("a",a, a.shape) - print(dset[0:2]) - print(np.reshape(dset[0],(None,2))) - print(dset[1]) - sys.exit(0) - -if False: - f = h5py.File('/tmp/foo.hdf5','w') - float32_t = 
h5py.special_dtype(vlen=np.dtype('float32')) - evolutionary_ = f.create_dataset('evolutionary', shape=(1, 3,), maxshape=(None, 3,), dtype=float32_t) - a = np.random.randn(1, 3, 4) - b = np.random.randn(1, 3, 6) - - evolutionary_[0] = a - print('evo[0] is \n', evolutionary_.value) - - evolutionary_.resize(3, axis=0) - evolutionary_[1] = b - print('evo[0,1,2] is\n', evolutionary_.value) - - sys.exit(0) - -if True: - f = h5py.File('/tmp/foo.hdf5','w') - dt = h5py.special_dtype(vlen=np.dtype('float32')) - dset = f.create_dataset('vlen_int', shape=(1,3,), maxshape=(None,3,), dtype=dt) - dset[0] = np.random.randn( 1, 3, 3 ) - dset.resize(3, axis=0) - dset[1] = np.random.randn( 1, 3, 1 ) - print( dset[0:] ) - - sys.exit(0) - -arr = np.empty(1, dtype=object) -print(type(arr), arr.shape, arr.dtype) - -a = np.ones( (2,2 )) -print(type(a), a.shape, a.dtype) -arr[0] = a - -h5f = h5py.File("/tmp/test", 'w') - -print("Adding cluster_list") -#h5f.create_dataset('cluster_list', data=arr) - -def add_ndarray_with_type_object( h5f, name, arr ): - print(type(arr), type(arr[0]), arr) - dt = arr[0].dtype - print("add", dt, arr.shape) - v = h5py.vlen_dtype(dt) - dset = h5f.create_dataset(name, arr.shape, dtype=dt) - for i in range( arr.shape[0] ): - dset[i] = arr[i] - print( type(dset) ) - print( dset ) - print( dset[0:] ) - -add_ndarray_with_type_object( h5f, "cluster_list", arr ) - -h5f.close() diff --git a/t3/gemini/buildidx/run_bin_build_index.sh b/t3/gemini/buildidx/run_bin_build_index.sh deleted file mode 100755 index 0d87d0953..000000000 --- a/t3/gemini/buildidx/run_bin_build_index.sh +++ /dev/null @@ -1,3 +0,0 @@ -#!/bin/bash - -PATH=/usr/bin:$PATH python3 build_index.py diff --git a/t3/gemini/buildidx/test.py b/t3/gemini/buildidx/test.py deleted file mode 100644 index 31044945c..000000000 --- a/t3/gemini/buildidx/test.py +++ /dev/null @@ -1,63 +0,0 @@ -import faiss -import numpy as np - -qd=768 -d=512 -nlist=5 - -nb=1000 -db = np.empty((nb, d // 8), dtype='uint8') - -quantizer = 
faiss.IndexBinaryFlat( d ) -index = faiss.IndexBinaryIVF( quantizer, d, nlist ) -index.train(db) -index.add(db) - -def convert_index_to_cluster_and_ids_lists(index, nbits): - cluster_list = np.empty(index.invlists.nlist, dtype=object) - ids_list = np.empty(index.invlists.nlist, dtype=object) - - zero_count = 0 - - for i in range(index.invlists.nlist): - list_sz = index.invlists.list_size(i) - - if list_sz == 0: - zero_count = zero_count + 1 - ids = None - else: - ids_ptr = index.invlists.get_ids(i) - ids = np.array(faiss.rev_swig_ptr(ids_ptr, list_sz)).reshape(-1, 1).astype(np.uint32) # GSL requires a 2d arrray for some reason - index.invlists.release_ids(ids_ptr) - #GW index.invlists.release_ids(list_sz, ids_ptr) - ids_list[i] = ids - - codes_ptr = index.invlists.get_codes(i) - codes = np.array(faiss.rev_swig_ptr(codes_ptr, list_sz * nbits // 8)).reshape(list_sz, nbits//8) - index.invlists.release_codes(codes_ptr) - #GW index.invlists.release_codes(list_sz * nbits // 8, codes_ptr) - cluster_list[i] = codes - - print('zero_count =', zero_count) - return cluster_list, ids_list - -cls, ids = convert_index_to_cluster_and_ids_lists(index,d) -print("cls", cls) -print("ids", ids) - -# Querying the index -nq = 10 -queries = np.empty((nq, d // 8), dtype='uint8') -print("queries", queries) -k = 1 -D, I = index.search(queries, k) -print("di",D,I) - - -quantizer = faiss.downcast_IndexBinary(index.quantizer) -print("Quantizer", type(quantizer)) -centroids = faiss.vector_to_array(quantizer.xb) -print("Centroids", type(centroids), centroids.shape) -centroids = np.reshape(centroids, (quantizer.ntotal, quantizer.d//8)) -print("Centroids", type(centroids), centroids.shape) -print('centroids (binary):', centroids.shape, centroids.dtype) diff --git a/t3/gemini/cost/AdvantechSky6200.pdf b/t3/gemini/cost/AdvantechSky6200.pdf deleted file mode 100644 index c0012482d..000000000 Binary files a/t3/gemini/cost/AdvantechSky6200.pdf and /dev/null differ diff --git a/t3/gemini/cost/GPU.pdf 
b/t3/gemini/cost/GPU.pdf deleted file mode 100644 index 01871eb40..000000000 Binary files a/t3/gemini/cost/GPU.pdf and /dev/null differ diff --git a/t3/gemini/cost/RAM.pdf b/t3/gemini/cost/RAM.pdf deleted file mode 100644 index 168285fbd..000000000 Binary files a/t3/gemini/cost/RAM.pdf and /dev/null differ diff --git a/t3/gemini/cost/SSD.pdf b/t3/gemini/cost/SSD.pdf deleted file mode 100644 index 2010b2910..000000000 Binary files a/t3/gemini/cost/SSD.pdf and /dev/null differ diff --git a/t3/gemini/requirements.txt b/t3/gemini/requirements.txt deleted file mode 100644 index f62d93c6a..000000000 --- a/t3/gemini/requirements.txt +++ /dev/null @@ -1,12 +0,0 @@ -numpy==1.16.0 -scipy==1.0.0 -scikit-learn==0.19.1 -faiss==1.5.3 -docker==2.6.1 -psutil==5.6.6 -h5py==2.10.0 -ansicolors==1.1.8 -tqdm==4.62.2 -dataclasses==0.8 -pyyaml -matplotlib diff --git a/t3/gemini/run_bin_python.sh b/t3/gemini/run_bin_python.sh deleted file mode 100755 index c5a21a8ca..000000000 --- a/t3/gemini/run_bin_python.sh +++ /dev/null @@ -1,18 +0,0 @@ -#!/bin/bash - -PATH=/usr/bin:$PATH which python3 -PATH=/usr/bin:$PATH python3 -c "import numpy;print('numpy',numpy.version.version)" -PATH=/usr/bin:$PATH pip3 show numpy - -PATH=/usr/bin:$PATH python3 -c "import scipy;print('scipy',scipy.version.version)" -PATH=/usr/bin:$PATH pip3 show scipy - -PATH=/usr/bin:$PATH python3 -c "import sklearn;print('sklearn',sklearn.__version__)" -PATH=/usr/bin:$PATH pip3 show sklearn - -PATH=/usr/bin:$PATH python3 -c "import faiss;print('faiss',faiss.__version__)" -PATH=/usr/bin:$PATH pip3 show faiss - -PATH=/usr/bin:$PATH LD_LIBRARY_PATH="./gsl_resources:$HOME/.local/lib/python3.6/site-packages/faiss" PYTHONPATH="./gsl_resources:$HOME/.local/lib/python3.6/site-packages/faiss" python3 run.py --t3 --nodocker --definitions t3/gemini/algos.yaml --dataset deep-1B --runs 1 - -#PATH=/usr/bin:$PATH LD_LIBRARY_PATH="/home/silo/BigANN/big-ann-benchmarks/gsl_resources:/home/silo/.local/lib/python3.6/site-packages/faiss" 
PYTHONPATH="/home/silo/BigANN/big-ann-benchmarks/gsl_resources:/home/silo/.local/lib/python3.6/site-packages/faiss" python3 run.py --t3 --nodocker --definitions t3/gemini/algos.yaml --dataset deep-1B --runs 1 diff --git a/t3/gemini/run_conda_python.sh b/t3/gemini/run_conda_python.sh deleted file mode 100755 index 24c7d2da3..000000000 --- a/t3/gemini/run_conda_python.sh +++ /dev/null @@ -1,20 +0,0 @@ -#!/bin/bash -#set -x - -#conda activate bigann-silo-py369 -which python3 -which pip3 - -python3 -c "import numpy;print('numpy',numpy.version.version)" -pip3 show numpy - -python3 -c "import scipy;print('scipy',scipy.version.version)" -pip3 show scipy - -python3 -c "import sklearn;print('sklearn',sklearn.__version__)" -pip3 show sklearn - -python3 -c "import faiss;print('faiss',faiss.__version__)" -pip3 show faiss - -LD_LIBRARY_PATH=./gsl_resources PYTHONPATH=./gsl_resources python3 run.py --t3 --nodocker --definitions t3/gemini/algos.yaml --dataset deep-1B --runs 1 diff --git a/templates/chartjs.template b/templates/chartjs.template index 466e3555b..2199afd90 100644 --- a/templates/chartjs.template +++ b/templates/chartjs.template @@ -1,102 +1,102 @@ -

{{xlabel}}/{{ylabel}}

-
- - -
- {% if args.latex %} -
-
- -
-
- - - {% endif %} +

{{xlabel}}/{{ylabel}}

+
+ + +
+ {% if args.latex %} +
+
+ +
+
+ + + {% endif %} diff --git a/templates/detail_page.html b/templates/detail_page.html index ce6193c2f..2f65c4b6e 100644 --- a/templates/detail_page.html +++ b/templates/detail_page.html @@ -1,23 +1,23 @@ -{% extends "general.html" %} - +{% extends "general.html" %} + diff --git a/templates/latex.template b/templates/latex.template index 438353418..c64643dba 100644 --- a/templates/latex.template +++ b/templates/latex.template @@ -1,30 +1,30 @@ - -\begin{figure} - \centering - \begin{tikzpicture} - \begin{axis}[ - xlabel={ {{xlabel}} }, - ylabel={ {{ylabel}} }, - ymode = log, - yticklabel style={/pgf/number format/fixed, - /pgf/number format/precision=3}, - legend style = { anchor=west}, - cycle list name = black white - ] - {% for algo in plot_data %} - {% if algo.scatter %} - \addplot [only marks] coordinates { - {% else %} - \addplot coordinates { - {% endif %} - {% for coord in algo.coords %} - ({{ coord[0]}}, {{ coord[1] }}) - {% endfor %} - }; - \addlegendentry{ {{algo.name}} }; - {% endfor %} - \end{axis} - \end{tikzpicture} - \caption{ {{caption}} } - \label{} -\end{figure} + +\begin{figure} + \centering + \begin{tikzpicture} + \begin{axis}[ + xlabel={ {{xlabel}} }, + ylabel={ {{ylabel}} }, + ymode = log, + yticklabel style={/pgf/number format/fixed, + /pgf/number format/precision=3}, + legend style = { anchor=west}, + cycle list name = black white + ] + {% for algo in plot_data %} + {% if algo.scatter %} + \addplot [only marks] coordinates { + {% else %} + \addplot coordinates { + {% endif %} + {% for coord in algo.coords %} + ({{ coord[0]}}, {{ coord[1] }}) + {% endfor %} + }; + \addlegendentry{ {{algo.name}} }; + {% endfor %} + \end{axis} + \end{tikzpicture} + \caption{ {{caption}} } + \label{} +\end{figure} diff --git a/templates/summary.html b/templates/summary.html index f83a7e1ea..271739014 100644 --- a/templates/summary.html +++ b/templates/summary.html @@ -1,14 +1,14 @@ -{% extends "general.html" %} -{% block content %} -
-

Billion-Scale Approximate Nearest Neighbor Search Challenge: NeurIPS'21 competition track

- -

- - - -{% endblock %} +{% extends "general.html" %} +{% block content %} +
+

Billion-Scale Approximate Nearest Neighbor Search Challenge: NeurIPS'21 competition track

+ +

+ + + +{% endblock %} diff --git a/tests/recall_tests.py b/tests/recall_tests.py deleted file mode 100755 index 95099a66d..000000000 --- a/tests/recall_tests.py +++ /dev/null @@ -1,243 +0,0 @@ -import numpy as np -import sys - -from benchmark.plotting.metrics import get_recall_values -from benchmark.datasets import DATASETS - -ASSERT= True # Stop unit tests on first failure - -GT_MIN_SIZE = 20 # Require ground truth with at least this length for each query - -def main_tests(): - # - # test recall computation on fake responses - # - - def test_recall( true_ids, true_dists, run_ids, count, expected_no_ties, expected_with_ties ): - '''This function will test the two forms of recall (with and without considering ties.)''' - - # compute recall, don't consider ties - recall = get_recall_values( (true_ids, true_dists), run_ids, count, False) - expected = 1.0 - print("compute recall(don't consider ties)=%f" % recall[0], "expected recall=%f" % expected_no_ties) - if ASSERT: - assert recall[0]==expected_no_ties - print("passed") - - # compute recall, consider ties - recall = get_recall_values( (true_ids, true_dists), run_ids, count, True) - expected = 1.0 - print("compute recall(consider ties)=%f num_queries_with_ties=%d" % (recall[0], recall[3]), "expected recall=%f" % expected_with_ties) - if ASSERT: - assert recall[0]==expected_with_ties - print("passed") - - print() - - print("TEST: fake query response with no distance ties, 1 query and k=3") - true_ids = np.array([ [ 0, 1, 2 ] ]) - true_dists = np.array([ [ 0.0, 1.0, 2.0 ] ]) - run_ids = np.array([ [ 0, 1, 2 ] ]) - count=3 - test_recall( true_ids, true_dists, run_ids, count, 1.0, 1.0 ) - - print("TEST: fake query response with no distance ties but not 1.0 recall, 1 query and k=3") - true_ids = np.array([ [ 0, 1, 2 ] ]) - true_dists = np.array([ [ 0.0, 1.0, 2.0 ] ]) - run_ids = np.array([ [ 0, 1, 3 ] ]) - count=3 - test_recall( true_ids, true_dists, run_ids, count, 2.0/3.0, 2.0/3.0 ) - - print("TEST: fake query response 
with no ties, 2 queries and k=3") - true_ids = np.array([ [ 0, 1, 2 ], [ 2, 1, 0 ] ]) - true_dists = np.array([ [ 0.0, 1.0, 2.0 ], [ 0.0, 1.0, 2.0 ] ]) - run_ids = np.array([ [ 0, 1, 2 ], [ 2, 1, 0 ] ]) - count=3 - test_recall( true_ids, true_dists, run_ids, count, 1.0, 1.0 ) - - print("TEST: fake query response with no distance ties, 1 query, k=3, GT array is larger than run array") - true_ids = np.array([ [ 0, 1, 2, 3 ] ]) - true_dists = np.array([ [ 0.0, 1.0, 2.0, 3.0 ] ]) - run_ids = np.array([ [ 0, 1, 2 ] ]) - count=3 - print("yuk true_ids=", true_ids.shape, "run_ids=", run_ids.shape) - test_recall( true_ids, true_dists, run_ids, count, 1.0, 1.0 ) - - print("TEST: fake query response with an out-of-bounds distance ties, 1 query, k=3, GT array is larger than run array.") - true_ids = np.array([ [ 0, 1, 2, 3 ] ]) - true_dists = np.array([ [ 0.0, 1.0, 2.0, 2.0 ] ]) - run_ids = np.array([ [ 0, 1, 2 ] ]) - count=3 - test_recall( true_ids, true_dists, run_ids, count, 1.0, 1.0 ) - - # this is from bigann GT and query set. The GT arrays are size=11 but run array is 10 and there are no ties to consider - print("TEST: from bigann-1B...") - true_ids = np.array([ [937541801, 221456167, 336118969, 971823307, 267986685, 544978851, 815975675, 615142927, 640142873, 994367459, 504814] ] ) - true_dists = np.array([ [55214., 58224., 58379., 58806., 59251., 59256., 60302., 60573., 60843., 60950., 61125.] 
] ) - run_ids = np.array([ [221456167, 336118969, 971823307, 640142873, 994367459, 504814, 87356234, 628179290, 928121617, 397551598 ] ] ) - count=10 - test_recall( true_ids, true_dists, run_ids, count, 0.5, 0.5 ) - - print("TEST: fake query response with ties at beginning, 2 queries and k=3") - true_ids = np.array([ [ 0, 1, 2, 3 ], [ 3, 2, 1, 0 ] ]) - true_dists = np.array([ [ 0.0, 0.0, 1.0, 2.0 ], [ 0.0, 0.0, 1.0, 2.0 ] ]) - run_ids = np.array([ [ 0, 1, 3 ], [ 3, 2, 0 ] ]) - count=3 - test_recall( true_ids, true_dists, run_ids, count, np.mean([2.0,2.0])/count, np.mean([2.0,2.0])/count) - - print("TEST: fake query response with ties at beginning and ties have small diff, 2 queries and k=3") - true_ids = np.array([ [ 0, 1, 2, 3 ], [ 3, 2, 1, 0 ] ]) - true_dists = np.array([ [ 0.0, 0.0+1e-6-1e-7, 1.0, 2.0 ], [ 0.0, 0.0+1e-6-1e-7, 1.0, 2.0 ] ]) - run_ids = np.array([ [ 0, 1, 3 ], [ 3, 2, 0 ] ]) - count=3 - test_recall( true_ids, true_dists, run_ids, count, np.mean([2.0,2.0])/count, np.mean([2.0,2.0])/count) - - print("TEST: fake query response with possible ties at beginning but diff is just beyond the 1e-6 threshold, 2 queries and k=3") - true_ids = np.array([ [ 0, 1, 2, 3 ], [ 3, 2, 1, 0 ] ]) - true_dists = np.array([ [ 0.0, 0.0+1e-6, 1.0, 2.0 ], [ 0.0, 0.0+1e-6, 1.0, 2.0 ] ]) - run_ids = np.array([ [ 0, 1, 3 ], [ 3, 2, 0 ] ]) - count=3 - test_recall( true_ids, true_dists, run_ids, count, np.mean([2.0,2.0])/count, np.mean([2.0,2.0])/count ) - - print("TEST: fake query response with ties in middle, 2 queries and k=3") - true_ids = np.array([ [ 0, 1, 2, 3 ], [ 3, 2, 1, 0 ] ]) - true_dists = np.array([ [ 0.0, 1.0, 1.0, 2.0 ], [ 0.0, 1.0, 1.0, 2.0 ] ]) - run_ids = np.array([ [ 0, 1, 3 ], [ 3, 2, 0 ] ]) - count=3 - test_recall( true_ids, true_dists, run_ids, count, np.mean([2.0,2.0])/count, np.mean([2.0,2.0])/count) - - print("TEST: fake query response with ties at count-1 and 1 tie after, 2 queries and k=3") - true_ids = np.array([ [ 0, 1, 2, 3 ], [ 3, 2, 1, 0 ] ]) - 
true_dists = np.array([ [ 0.0, 1.0, 2.0, 2.0 ], [ 0.0, 1.0, 2.0, 2.0 ] ]) - run_ids = np.array([ [ 0, 1, 3 ], [ 3, 2, 0 ] ]) - count=3 - test_recall( true_ids, true_dists, run_ids, count, np.mean([2.0, 2.0])/float(count), np.mean([3.0, 3.0])/float(count) ) - - print("TEST: fake query response with ties at count-1 and 1 tie after and 1 after that that is cloe, 2 queries and k=3") - true_ids = np.array([ [ 0, 1, 2, 3 ], [ 3, 2, 1, 0 ] ]) - true_dists = np.array([ [ 0.0, 1.0, 2.0, 2.0 ], [ 0.0, 1.0, 2.0, 2.0 ] ]) - run_ids = np.array([ [ 0, 1, 3 ], [ 3, 2, 0 ] ]) - count=3 - test_recall( true_ids, true_dists, run_ids, count, np.mean([2.0, 2.0])/float(count), np.mean([3.0, 3.0])/float(count) ) - - print("TEST: fake query response with ties at count-1 and several close ties after, 2 queries and k=3") - true_ids = np.array([ [ 0, 1, 2, 3, 4, 5 ], [ 5, 4, 3, 2, 1, 0 ] ]) - true_dists = np.array([ [ 0.0, 1.0, 2.0, 2.0, 2.0+1e-6-1e-7, 2.0+1e-6 ], [ 0.0, 1.0, 2.0, 2.0, 2.0+1e-6-1e-7, 2.0+1e-6 ] ]) - run_ids = np.array([ [ 0, 1, 4 ], [ 5, 4, 0 ] ]) - count=3 - test_recall( true_ids, true_dists, run_ids, count, np.mean([2.0,2.0])/count, np.mean([3.0, 2.0])/float(count) ) - - print("TEST: fake query response with two independent tie groups, 2 queries and k=3") - true_ids = np.array([ [ 0, 1, 2, 3, 4, 5 ], [ 5, 4, 3, 2, 1, 0 ] ]) - true_dists = np.array([ [ 0.0, 0.0, 2.0, 3.0, 3.0, 4.0 ], [ 0.0, 0.0, 2.0, 3.0, 3.0, 4.0 ] ]) - run_ids = np.array([ [ 0, 1, 5 ], [ 5, 4, 1 ] ]) - count=3 - test_recall( true_ids, true_dists, run_ids, count, np.mean([2.0, 2.0])/float(count), np.mean([2.0, 2.0])/float(count) ) - - print("TEST: fake query response with two independent tie groups, 2 queries and k=4") - true_ids = np.array([ [ 0, 1, 2, 3, 4, 5, 6 ], [ 6, 5, 4, 3, 2, 1, 0 ] ]) - true_dists = np.array([ [ 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 5.0 ], [ 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 5.0 ] ]) - run_ids = np.array([ [ 0, 1, 5, 7 ], [ 5, 4, 1, 7 ] ]) - count=4 - test_recall( true_ids, true_dists, 
run_ids, count, np.mean([2.0, 2.0])/float(count), np.mean([2.0, 2.0])/float(count) ) - - # - # dataset tests - # - def test_GT_monotonicity( dset, increasing=True ): - print("TEST: %s, checking GT distances monotonicity" % dset) - dataset = DATASETS[dset]() - gt = dataset.get_groundtruth() - if ASSERT: assert len(gt)==2 - true_ids = gt[0] - true_dists = gt[1] - if ASSERT: - assert true_ids.shape[1]==true_dists.shape[1] - assert true_ids.shape[1]>=GT_MIN_SIZE - assert true_dists.shape[1]>=GT_MIN_SIZE - func = monotone_increasing if increasing else monotone_decreasing - for i in range(true_dists.shape[0]): - mtest = func(true_dists[i]) - if ASSERT: assert mtest==True - print() - - print("TEST: sanity check the monotone functions") - mtest = monotone_increasing([0,1,2,3,4,5]) - if ASSERT: assert mtest==True - mtest = monotone_increasing([0,0,0,3,4,5]) - if ASSERT: assert mtest==True - mtest = monotone_increasing([3,4,5,4,3,4,5]) - if ASSERT: assert mtest==False - mtest = monotone_increasing([5,4,4,3,2,1]) - if ASSERT: assert mtest==False - print() - - # check GT dist increasing monotonicity for each knn dataset - test_GT_monotonicity( "bigann-1B" ) - test_GT_monotonicity( "deep-1B" ) - test_GT_monotonicity( "msturing-1B" ) - test_GT_monotonicity( "msspacev-1B" ) - test_GT_monotonicity( "text2image-1B", increasing=False) - - # - # test recall on actual datasets - # - def extract_GT_monotonicity( dset, row, c1, c2): - print("TEST: %s, extraction" % dset, row, c1, c2) - dataset = DATASETS[dset]() - gt = dataset.get_groundtruth() - true_dists = gt[1] - lst = true_dists[row,c1:c2] - print(lst) - mtest = monotone_increasing(lst) - print(mtest) - print() - - def test_GT_as_query( dset, count ): - print("TEST: %s, using GT as query, k=10" % dset) - dataset = DATASETS[dset]() - gt = dataset.get_groundtruth() - if ASSERT: assert len(gt)==2 - true_ids = gt[0] - true_dists = gt[1] - if ASSERT: - assert true_ids.shape[1]==true_dists.shape[1] - assert true_ids.shape[1]>=GT_MIN_SIZE 
- assert true_dists.shape[1]>=GT_MIN_SIZE - run_ids = np.copy( gt[0] )[:,0:count] # create a query set from GT truncated at k - test_recall( true_ids, true_dists, run_ids, count, 1.0, 1.0 ) - - # test GT as query for each dataset - test_GT_as_query( "bigann-1B", 10 ) - test_GT_as_query( "deep-1B", 10 ) - test_GT_as_query( "text2image-1B", 10 ) - test_GT_as_query( "msturing-1B", 10 ) - test_GT_as_query( "msspacev-1B", 10 ) - - sys.exit(0) - - - -# -# useful functions -# -import itertools -import operator - -def monotone_increasing(lst): - pairs = zip(lst, lst[1:]) - bools = list(itertools.starmap(operator.le, pairs)) - #print(type(bools), len(bools), bools) - return all( bools ) - -def monotone_decreasing(lst): - pairs = zip(lst, lst[1:]) - bools = list(itertools.starmap(operator.ge, pairs)) - #print(type(lst), lst) - return all( bools ) - -def monotone(lst): - return monotone_increasing(lst) or monotone_decreasing(lst) - -if __name__ == "__main__": - main_tests() diff --git a/tests/tests.sh b/tests/tests.sh deleted file mode 100755 index 2e59a08d9..000000000 --- a/tests/tests.sh +++ /dev/null @@ -1,6 +0,0 @@ -#!/bin/bash - -# You should run this script from the repo top-level directory - -PYTHONPATH="." python tests/recall_tests.py - diff --git a/track1_baseline_faiss/README.md b/track1_baseline_faiss/README.md deleted file mode 100644 index 090f80ed2..000000000 --- a/track1_baseline_faiss/README.md +++ /dev/null @@ -1,170 +0,0 @@ -# Running the Faiss baselines - -## Installing software - -In addition to this repository, running the baseline code requires a conda install with Faiss - -```bash -wget https://repo.anaconda.com/archive/Anaconda3-2020.11-Linux-x86_64.sh - -bash Anaconda3-2020.11-Linux-x86_64.sh - -# follow instructions and run profile.sh to get a working conda - -conda create -n faiss_1.7.1 python=3.8 -conda activate faiss_1.7.1 -conda install -c pytorch faiss-cpu -``` - -All instructions below are supposed to be run from the root of the repository. 
-To make the package accessible, set `export PYTHONPATH=.` - -## Downloading the data - -To download the data (database files, query files and ground truth, do -``` -mkdir data/ # this is where all the data goes, a symlink is fine -python track1_baseline_faiss/baseline_faiss.py --dataset deep-1B --prepare -``` -The available datasets are bigann-1B deep-1B ssnpp-1B text2image-1B msturing-1B msspacev-1B. -To download the largest files, `--prepare` will use axel or azcopy. Make sure that they are in the path. - -Replace the -1B suffix with -100M or -10M to get a subset of each dataset (only the relevant fraction of the database will be downloaded). -This is useful for small-scale experiments. - -## Building the index - -There are several types of indexes in Faiss. -Here we focus on IVF variants with PQ compression as recommended [here](https://github.com/facebookresearch/faiss/wiki/Guidelines-to-choose-an-index#if-100m---1b-ivf1048576_hnsw32) and evaluated [here](https://github.com/facebookresearch/faiss/wiki/Indexing-1G-vectors#1b-datasets). - -The problem is that they require very large codebooks to define the IVF clusters. -This is fine (kind of) when a GPU is available to run the clustering, but not on CPU only. -Therefore, we perform a two-level clustering with n' = sqrt(ncentroids) first level cluster and n' clusterings of size n' at a refined level. -Then all n' * n' sub-clusters are indexed together in an IVF_HNSW. - -This writes like: - -```bash -python -u track1_baseline_faiss/baseline_faiss.py --dataset deep-1B \ - --indexkey OPQ64_128,IVF1048576_HNSW32,PQ64x4fsr \ - --maxtrain 100000000 \ - --two_level_clustering \ - --build \ - --add_splits 30 \ - --indexfile data/track1_baseline_faiss/deep-1B.IVF1M_2level_PQ64x4fsr.faissindex \ - --quantizer_efConstruction 200 \ - --quantizer_add_efSearch 80 -``` - -This works for deep-1B bigann-1B msturing-1B msspacev-1B. 
- -For ssnpp-1B, the type of index has to be adjusted a bit because the Faiss PQ64x4fsr does not support range search (see [the documentation of Faiss index types](https://github.com/facebookresearch/faiss/wiki/The-index-factory#encodings) for an explanation of the difference). - -Therefore, we use a slightly slower index type: PQ32. This gives: -```bash -python -u track1_baseline_faiss/baseline_faiss.py --dataset ssnpp-1B \ - --indexkey OPQ64_128,IVF1048576_HNSW32,PQ32 \ - --maxtrain 100000000 \ - --two_level_clustering \ - --build \ - --add_splits 30 \ - --indexfile data/track1_baseline_faiss/ssnpp-1B.IVF1M_2level_PQ23.faissindex \ - --quantizer_efConstruction 200 \ - --quantizer_add_efSearch 80 -``` - -The results on text2image-1B with the same index types are a lot worse. -This is probably due to the very lossy PQ compression. - -## Running the evaluation - -### Getting the pre-built indexes - -Pre-built indexes are available. -To download them - -```bash -wget https://dl.fbaipublicfiles.com/billion-scale-ann-benchmarks/track1_baseline_faiss/deep-1B.IVF1M_2level_PQ64x4fsr.faissindex -P data/ -wget https://dl.fbaipublicfiles.com/billion-scale-ann-benchmarks/track1_baseline_faiss/bigann-1B.IVF1M_2level_PQ64x4fsr.faissindex -P data/ -wget https://dl.fbaipublicfiles.com/billion-scale-ann-benchmarks/track1_baseline_faiss/msturing-1B.IVF1M_2level_PQ64x4fsr.faissindex -P data/ -wget https://dl.fbaipublicfiles.com/billion-scale-ann-benchmarks/track1_baseline_faiss/msspacev-1B.IVF1M_2level_PQ64x4fsr.faissindex -P data/ - -wget https://dl.fbaipublicfiles.com/billion-scale-ann-benchmarks/track1_baseline_faiss/ssnpp-1B.IVF1M_2level_PQ32.faissindex -P data/ -wget https://dl.fbaipublicfiles.com/billion-scale-ann-benchmarks/track1_baseline_faiss/text2image-1B.IVF1M_2level_PQ32.faissindex -P data/ - -``` - - -### Running the evaluation - - - - -The evaluation proceeds by loading the index and looping over a set of search-time parameters that obtain different speed-accuracy 
tradeoffs. - -This is written as: -```bash - -params=" -nprobe=1,quantizer_efSearch=4 -nprobe=2,quantizer_efSearch=4 -... -nprobe=512,quantizer_efSearch=256 -nprobe=512,quantizer_efSearch=512 -nprobe=1024,quantizer_efSearch=512 -" - -python track1_baseline_faiss/baseline_faiss.py \ - --dataset deep-1B --indexfile data/deep-1B.IVF1M_2level_PQ64x4fsr.faissindex \ - --search --searchparams $params - -``` - -The sets of parameters per dataset are listed in [this GIST](https://gist.github.com/mdouze/bb71032f0b3bf3cc9bdaa6ff1287c144). -They are ordered from fastest / least accurate to slowest / most accurate. - -### Results - -The results should look like: - -``` -parameters inter@ 10 time(ms/q) nb distances #runs -nprobe=1,quantizer_efSearch=4 0.1738 0.00327 12210374 92 -nprobe=2,quantizer_efSearch=4 0.2394 0.00424 24328050 71 -nprobe=2,quantizer_efSearch=8 0.2879 0.00545 24278048 56 -... -nprobe=512,quantizer_efSearch=256 0.6877 0.75883 5896044691 1 -nprobe=512,quantizer_efSearch=512 0.6886 0.77421 5890639041 1 -nprobe=1024,quantizer_efSearch=512 0.6886 1.46841 11607413418 1 -``` - -This means that by setting the parameters `nprobe=2,quantizer_efSearch=4`, we obtain 0.2394 recall @ 10 (aka inter @10) for that dataset, and the search will take 0.00424 ms per query (235849 QPS). -The total number of distances computed for all queries is 24328050 and this measurement was obtained in 71 runs (to reduce jitter in time measurements). 
- - -### Plots - -The speed-accuracy tradeoff plots are here (with 32 threads on a given 2.2 GHz machine): - -![](plots/bigann-1B.png) - -![](plots/deep-1B.png) - -![](plots/msturing-1B.png) - -![](plots/msspacev-1B.png) - -![](plots/ssnpp-1B.png) - -![](plots/text2image-1B.png) - - -### Determining the optimal search-time parameters - -The Pareto-optimal parameter combinations can be obtained by a random exploration of the parameter space, as described [here](https://github.com/facebookresearch/faiss/wiki/Index-IO,-cloning-and-hyper-parameter-tuning#auto-tuning-the-runtime-parameters). -To perform this operation, do: -```bash -python track1_baseline_faiss/baseline_faiss.py \ - --dataset deep-1B --indexfile data/deep-1B.IVF1M_2level_PQ64x4fsr.faissindex \ - --search -``` diff --git a/track1_baseline_faiss/__init__.py b/track1_baseline_faiss/__init__.py deleted file mode 100644 index e69de29bb..000000000 diff --git a/track1_baseline_faiss/baseline_faiss.py b/track1_baseline_faiss/baseline_faiss.py deleted file mode 100644 index 4446401e2..000000000 --- a/track1_baseline_faiss/baseline_faiss.py +++ /dev/null @@ -1,791 +0,0 @@ -import os -import sys -import time -import pdb -import gc -import numpy as np -import faiss -import argparse -import resource - -import benchmark.datasets -from benchmark.datasets import DATASETS -from benchmark.plotting import eval_range_search - -#################################################################### -# Index building functions -#################################################################### - - -def two_level_clustering(xt, nc1, nc2, clustering_niter=25, spherical=False): - d = xt.shape[1] - - print(f"2-level clustering of {xt.shape} nb clusters = {nc1}*{nc2} = {nc1*nc2}") - print("perform coarse training") - - km = faiss.Kmeans( - d, nc1, verbose=True, niter=clustering_niter, - max_points_per_centroid=2000, - spherical=spherical - ) - km.train(xt) - - print() - - # coarse centroids - centroids1 = km.centroids - - 
print("assigning the training set") - t0 = time.time() - _, assign1 = km.assign(xt) - bc = np.bincount(assign1, minlength=nc1) - print(f"done in {time.time() - t0:.2f} s. Sizes of clusters {min(bc)}-{max(bc)}") - o = assign1.argsort() - del km - - # train sub-clusters - i0 = 0 - c2 = [] - t0 = time.time() - for c1 in range(nc1): - print(f"[{time.time() - t0:.2f} s] training sub-cluster {c1}/{nc1}\r", end="", flush=True) - i1 = i0 + bc[c1] - subset = o[i0:i1] - assert np.all(assign1[subset] == c1) - km = faiss.Kmeans(d, nc2, spherical=spherical) - xtsub = xt[subset] - km.train(xtsub) - c2.append(km.centroids) - i0 = i1 - print(f"done in {time.time() - t0:.2f} s") - return np.vstack(c2) - - -def unwind_index_ivf(index): - if isinstance(index, faiss.IndexPreTransform): - assert index.chain.size() == 1 - vt = faiss.downcast_VectorTransform(index.chain.at(0)) - index_ivf, vt2 = unwind_index_ivf(faiss.downcast_index(index.index)) - assert vt2 is None - return index_ivf, vt - if hasattr(faiss, "IndexRefine") and isinstance(index, faiss.IndexRefine): - return unwind_index_ivf(faiss.downcast_index(index.base_index)) - if isinstance(index, faiss.IndexIVF): - return index, None - else: - return None, None - - -def build_index(args, ds): - nq, d = ds.nq, ds.d - nb, d = ds.nq, ds.d - - if args.buildthreads == -1: - print("Build-time number of threads:", faiss.omp_get_max_threads()) - else: - print("Set build-time number of threads:", args.buildthreads) - faiss.omp_set_num_threads(args.buildthreads) - - metric_type = ( - faiss.METRIC_L2 if ds.distance() == "euclidean" else - faiss.METRIC_INNER_PRODUCT if ds.distance() in ("ip", "angular") else - 1/0 - ) - print("metric type", metric_type) - index = faiss.index_factory(d, args.indexkey, metric_type) - - index_ivf, vec_transform = unwind_index_ivf(index) - if vec_transform is None: - vec_transform = lambda x: x - else: - vec_transform = faiss.downcast_VectorTransform(vec_transform) - - if args.by_residual != -1: - by_residual = 
args.by_residual == 1 - print("setting by_residual = ", by_residual) - index_ivf.by_residual # check if field exists - index_ivf.by_residual = by_residual - - if index_ivf: - print("Update add-time parameters") - # adjust default parameters used at add time for quantizers - # because otherwise the assignment is inaccurate - quantizer = faiss.downcast_index(index_ivf.quantizer) - if isinstance(quantizer, faiss.IndexRefine): - print(" update quantizer k_factor=", quantizer.k_factor, end=" -> ") - quantizer.k_factor = 32 if index_ivf.nlist < 1e6 else 64 - print(quantizer.k_factor) - base_index = faiss.downcast_index(quantizer.base_index) - if isinstance(base_index, faiss.IndexIVF): - print(" update quantizer nprobe=", base_index.nprobe, end=" -> ") - base_index.nprobe = ( - 16 if base_index.nlist < 1e5 else - 32 if base_index.nlist < 4e6 else - 64) - print(base_index.nprobe) - elif isinstance(quantizer, faiss.IndexHNSW): - print(" update quantizer efSearch=", quantizer.hnsw.efSearch, end=" -> ") - if args.quantizer_add_efSearch > 0: - quantizer.hnsw.efSearch = args.quantizer_add_efSearch - else: - quantizer.hnsw.efSearch = 40 if index_ivf.nlist < 4e6 else 64 - print(quantizer.hnsw.efSearch) - if args.quantizer_efConstruction != -1: - print(" update quantizer efConstruction=", quantizer.hnsw.efConstruction, end=" -> ") - quantizer.hnsw.efConstruction = args.quantizer_efConstruction - print(quantizer.hnsw.efConstruction) - - - index.verbose = True - if index_ivf: - index_ivf.verbose = True - index_ivf.quantizer.verbose = True - index_ivf.cp.verbose = True - - - maxtrain = args.maxtrain - if maxtrain == 0: - if 'IMI' in args.indexkey: - maxtrain = int(256 * 2 ** (np.log2(index_ivf.nlist) / 2)) - elif index_ivf: - maxtrain = 50 * index_ivf.nlist - else: - # just guess... 
- maxtrain = 256 * 100 - maxtrain = max(maxtrain, 256 * 100) - print("setting maxtrain to %d" % maxtrain) - - # train on dataset - print(f"getting first {maxtrain} dataset vectors for training") - - xt2 = next(ds.get_dataset_iterator(bs=maxtrain)) - - print("train, size", xt2.shape) - assert np.all(np.isfinite(xt2)) - - t0 = time.time() - - if (isinstance(vec_transform, faiss.OPQMatrix) and - isinstance(index_ivf, faiss.IndexIVFPQFastScan)): - print(" Forcing OPQ training PQ to PQ4") - ref_pq = index_ivf.pq - training_pq = faiss.ProductQuantizer( - ref_pq.d, ref_pq.M, ref_pq.nbits - ) - vec_transform.pq - vec_transform.pq = training_pq - - if args.clustering_niter >= 0: - print(("setting nb of clustering iterations to %d" % - args.clustering_niter)) - index_ivf.cp.niter = args.clustering_niter - - train_index = None - if args.train_on_gpu: - print("add a training index on GPU") - train_index = faiss.index_cpu_to_all_gpus( - faiss.IndexFlatL2(index_ivf.d)) - index_ivf.clustering_index = train_index - - if args.two_level_clustering: - sqrt_nlist = int(np.sqrt(index_ivf.nlist)) - assert sqrt_nlist ** 2 == index_ivf.nlist - - centroids_trainset = xt2 - if isinstance(vec_transform, faiss.VectorTransform): - print(" training vector transform") - vec_transform.train(xt2) - print(" transform trainset") - centroids_trainset = vec_transform.apply_py(centroids_trainset) - - centroids = two_level_clustering( - centroids_trainset, sqrt_nlist, sqrt_nlist, - spherical=(metric_type == faiss.METRIC_INNER_PRODUCT) - ) - - if not index_ivf.quantizer.is_trained: - print(" training quantizer") - index_ivf.quantizer.train(centroids) - - print(" add centroids to quantizer") - index_ivf.quantizer.add(centroids) - - index.train(xt2) - print(" Total train time %.3f s" % (time.time() - t0)) - - if train_index is not None: - del train_index - index_ivf.clustering_index = None - gc.collect() - - print("adding") - - t0 = time.time() - if args.add_bs == -1: - 
index.add(sanitize(ds.get_database())) - else: - i0 = 0 - nsplit = args.add_splits - for sno in range(nsplit): - print(f"============== SPLIT {sno}/{nsplit}") - for xblock in ds.get_dataset_iterator(bs=args.add_bs, split=(nsplit, sno)): - i1 = i0 + len(xblock) - print(" adding %d:%d / %d [%.3f s, RSS %d kiB] " % ( - i0, i1, ds.nb, time.time() - t0, - faiss.get_mem_usage_kb())) - index.add(xblock) - i0 = i1 - gc.collect() - if sno == args.stop_at_split: - print("stopping at split", sno) - break - - print(" add in %.3f s" % (time.time() - t0)) - if args.indexfile: - print("storing", args.indexfile) - faiss.write_index(index, args.indexfile) - - return index - -#################################################################### -# Evaluation functions -#################################################################### - - -def compute_inter(a, b): - nq, rank = a.shape - ninter = sum( - np.intersect1d(a[i, :rank], b[i, :rank]).size - for i in range(nq) - ) - return ninter / a.size - -def knn_search_batched(index, xq, k, bs): - D, I = [], [] - for i0 in range(0, len(xq), bs): - Di, Ii = index.search(xq[i0:i0 + bs], k) - D.append(Di) - I.append(Ii) - return np.vstack(D), np.vstack(I) - -def eval_setting_knn(index, xq, gt, k=0, inter=False, min_time=3.0, query_bs=-1): - nq = xq.shape[0] - gt_I, gt_D = gt - - ivf_stats = faiss.cvar.indexIVF_stats - ivf_stats.reset() - nrun = 0 - t0 = time.time() - while True: - if query_bs == -1: - D, I = index.search(xq, k) - else: - D, I = knn_search_batched(index, xq, k, query_bs) - nrun += 1 - t1 = time.time() - if t1 - t0 > min_time: - break - ms_per_query = ((t1 - t0) * 1000.0 / nq / nrun) - - if inter: - rank = k - inter_measure = compute_inter(gt_I[:, :rank], I[:, :rank]) - print("%.4f" % inter_measure, end=' ') - else: - for rank in 1, 10, 100: - n_ok = (I[:, :rank] == gt_I[:, :1]).sum() - print("%.4f" % (n_ok / float(nq)), end=' ') - print(" %9.5f " % ms_per_query, end=' ') - - if ivf_stats.search_time == 0: - # happens for 
IVFPQFastScan where the stats are not logged by default - print("%12d %5.2f " % (ivf_stats.ndis / nrun, 0.0), end=' ') - else: - pc_quantizer = ivf_stats.quantization_time / ivf_stats.search_time * 100 - print("%12d %5.2f " % (ivf_stats.ndis / nrun, pc_quantizer), end=' ') - print(nrun) - -def eval_setting_range(index, xq, gt, radius=0, inter=False, min_time=3.0, query_bs=-1): - nq = xq.shape[0] - gt_nres, gt_I, gt_D = gt - gt_lims = np.zeros(nq + 1, dtype=int) - gt_lims[1:] = np.cumsum(gt_nres) - ivf_stats = faiss.cvar.indexIVF_stats - ivf_stats.reset() - nrun = 0 - t0 = time.time() - while True: - if query_bs == -1: - lims, D, I = index.range_search(xq, radius) - else: - raise NotImplemented - nrun += 1 - t1 = time.time() - if t1 - t0 > min_time: - break - ms_per_query = ((t1 - t0) * 1000.0 / nq / nrun) - - ap = eval_range_search.compute_AP((gt_lims, gt_I, gt_D), (lims, I, D)) - print("%.4f" % ap, end=' ') - print(" %9.5f " % ms_per_query, end=' ') - - print("%12d %5d " % (ivf_stats.ndis / nrun, D.size), end=' ') - print(nrun) - - -def result_header(ds, args): - - # setup the Criterion object - if ds.search_type() == "range": - header = ( - '%-40s AP time(ms/q) nb distances nb_res #runs' % - "parameters" - ) - crit = None - elif args.inter: - print("Optimize for intersection @ ", args.k) - crit = faiss.IntersectionCriterion(ds.nq, args.k) - header = ( - '%-40s inter@%3d time(ms/q) nb distances %%quantization #runs' % - ("parameters", args.k) - ) - else: - print("Optimize for 1-recall @ 1") - crit = faiss.OneRecallAtRCriterion(ds.nq, 1) - header = ( - '%-40s R@1 R@10 R@100 time(ms/q) nb distances %%quantization #runs' % - "parameters" - ) - return header, crit - -def op_compute_bounds(ps, ops, cno): - # lower_bound_t = 0.0 - # upper_bound_perf = 1.0 - bounds = np.array([0, 1], dtype="float64") - sp = faiss.swig_ptr - for i in range(ops.all_pts.size()): - ps.update_bounds(cno, ops.all_pts.at(i), sp(bounds[1:2]), sp(bounds[0:1])) - # lower_bound_t, upper_bound_perf 
- return bounds[0], bounds[1] - - - -def explore_parameter_space_range(index, xq, gt, ps, radius): - """ exploration of the parameter space for range search, using the - Average Precision as criterion - """ - - n_experiments = ps.n_experiments - n_comb = ps.n_combinations() - min_time = ps.min_test_duration - verbose = ps.verbose - - gt_nres, gt_I, gt_D = gt - gt_lims = np.zeros(len(gt_nres) + 1, dtype=int) - gt_lims[1:] = np.cumsum(gt_nres) - gt = (gt_lims, gt_I, gt_D) - - ops = faiss.OperatingPoints() - - def run_1_experiment(cno): - ps.set_index_parameters(index, cno) - - nrun = 0 - t0 = time.time() - while True: - lims, D, I = index.range_search(xq, radius) - nrun += 1 - t1 = time.time() - if t1 - t0 > min_time: - break - - t_search = (t1 - t0) / nrun - perf = eval_range_search.compute_AP(gt, (lims, I, D)) - keep = ops.add(perf, t_search, ps.combination_name(cno), cno) - - return len(D), perf, t_search, nrun, keep - - if n_experiments == 0: - # means exhaustive run - for cno in range(n_comb): - nres, perf, t_search, nrun, keep = run_1_experiment(cno) - - if verbose: - print(" %d/%d: %s nres=%d perf=%.3f t=%.3f s %s" % ( - cno, n_comb, - ps.combination_name(cno), - nres, perf, t_search, "*" if keep else "")) - return ops - - n_experiments = min(n_experiments, n_comb) - - perm = np.zeros(n_experiments, int) - # make sure the slowest and fastest experiment are run - perm[0] = 0 - perm[1] = n_comb - 1 - rs = np.random.RandomState(1234) - perm[2:] = 1 + rs.choice(n_comb - 2, n_experiments - 2, replace=False) - - for xp, cno in enumerate(perm): - cno = int(cno) - if verbose: - print(" %d/%d: cno=%d %s " % ( - xp, n_experiments, cno, ps.combination_name(cno)), - end="", flush=True) - - # check if we can skip this experiment - lower_bound_t, upper_bound_perf = op_compute_bounds(ps, ops, cno) - - best_t = ops.t_for_perf(upper_bound_perf) - - if verbose: - print("bounds [perf<=%.3f t>=%.3f] " % ( - upper_bound_perf, lower_bound_t), - end="skip\n" if best_t <= 
lower_bound_t else " " - ) - if best_t <= lower_bound_t: - continue - - nres, perf, t_search, nrun, keep = run_1_experiment(cno) - - if verbose: - print(" nres %d perf %.3f t %.3f (%d %s) %s" % ( - nres, perf, t_search, nrun, - "runs" if nrun >= 2 else "run", - "*" if keep else "")) - - return ops - - -#################################################################### -# Driver functions -#################################################################### - - - -def run_experiments_searchparams(ds, index, args): - """ - Evaluate a predefined set of runtime parameters - """ - k = args.k - xq = ds.get_queries() - - nq = len(xq) - - ps = faiss.ParameterSpace() - ps.initialize(index) - - header, _ = result_header(ds, args) - - searchparams = args.searchparams - - print(f"Running evaluation on {len(searchparams)} searchparams") - print(header) - maxw = max(max(len(p) for p in searchparams), 40) - for params in searchparams: - ps.set_index_parameters(index, params) - - print(params.ljust(maxw), end=' ') - sys.stdout.flush() - - if ds.search_type() == "knn": - eval_setting_knn( - index, xq, ds.get_groundtruth(k=args.k), - k=args.k, - inter=args.inter, min_time=args.min_test_duration, - query_bs=args.query_bs - ) - else: - eval_setting_range( - index, xq, ds.get_groundtruth(k=args.k), - radius=args.radius, - inter=args.inter, min_time=args.min_test_duration, - query_bs=args.query_bs - ) - - -def run_experiments_autotune(ds, index, args): - """ Explore the space of parameters and keep Pareto-optimal ones. 
""" - k = args.k - - xq = ds.get_queries() - nq = len(xq) - - ps = faiss.ParameterSpace() - ps.initialize(index) - - ps.n_experiments = args.n_autotune - ps.min_test_duration = args.min_test_duration - - for kv in args.autotune_max: - k, vmax = kv.split(':') - vmax = float(vmax) - print("limiting %s to %g" % (k, vmax)) - pr = ps.add_range(k) - values = faiss.vector_to_array(pr.values) - values = np.array([v for v in values if v < vmax]) - faiss.copy_array_to_vector(values, pr.values) - - for kv in args.autotune_range: - k, vals = kv.split(':') - vals = np.fromstring(vals, sep=',') - print("setting %s to %s" % (k, vals)) - pr = ps.add_range(k) - faiss.copy_array_to_vector(vals, pr.values) - - header, crit = result_header(ds, args) - - # then we let Faiss find the optimal parameters by itself - print("exploring operating points, %d threads" % faiss.omp_get_max_threads()); - ps.display() - - t0 = time.time() - - if ds.search_type() == "knn": - # by default, the criterion will request only 1 NN - crit.nnn = args.k - gt_I, gt_D = ds.get_groundtruth(k=args.k) - crit.set_groundtruth(None, gt_I.astype('int64')) - op = ps.explore(index, xq, crit) - elif ds.search_type() == "range": - op = explore_parameter_space_range( - index, xq, ds.get_groundtruth(), ps, args.radius - ) - else: - assert False - - print("Done in %.3f s, available OPs:" % (time.time() - t0)) - op.display() - - print("Re-running evaluation on selected OPs") - print(header) - opv = op.optimal_pts - maxw = max(max(len(opv.at(i).key) for i in range(opv.size())), 40) - for i in range(opv.size()): - opt = opv.at(i) - - ps.set_index_parameters(index, opt.key) - - print(opt.key.ljust(maxw), end=' ') - sys.stdout.flush() - if ds.search_type() == "knn": - eval_setting_knn( - index, xq, ds.get_groundtruth(k=args.k), - k=args.k, - inter=args.inter, min_time=args.min_test_duration - ) - else: - eval_setting_range( - index, xq, ds.get_groundtruth(k=args.k), - radius=args.radius, - inter=args.inter, 
min_time=args.min_test_duration - ) - - -class DatasetWrapInPairwiseQuantization: - - def __init__(self, ds, C): - self.ds = ds - self.C = C - self.Cq = np.linalg.inv(C.T) - # xb_pw = np.ascontiguousarray((C @ xb.T).T) - # xq_pw = np.ascontiguousarray((Cq @ xq.T).T) - # copy fields - - for name in "nb d nq dtype distance search_type get_groundtruth".split(): - setattr(self, name, getattr(ds, name)) - - def get_dataset(self): - return self.ds.get_dataset() @ self.C.T - - def get_queries(self): - return self.ds.get_queries() @ self.Cq.T - - def get_dataset_iterator(self, bs=512, split=(1,0)): - for xb in self.ds.get_dataset_iterator(bs=bs, split=split): - yield xb @ self.C.T - - -#################################################################### -# Main -#################################################################### - - -def main(): - - parser = argparse.ArgumentParser() - - def aa(*args, **kwargs): - group.add_argument(*args, **kwargs) - - group = parser.add_argument_group('What to do') - aa('--build', default=False, action="store_true") - aa('--search', default=False, action="store_true") - aa('--prepare', default=False, action="store_true", - help="call prepare() to download the dataset before computing") - - group = parser.add_argument_group('dataset options') - aa('--dataset', choices=DATASETS.keys(), required=True) - aa('--basedir', help="override basedir for dataset") - aa('--pairwise_quantization', default="", - help="load/store pairwise quantization matrix") - aa('--query_bs', default=-1, type=int, - help='perform queries in batches of this size') - - group = parser.add_argument_group('index construction') - - aa('--indexkey', default='HNSW32', help='index_factory type') - aa('--by_residual', default=-1, type=int, - help="set if index should use residuals (default=unchanged)") - aa('--M0', default=-1, type=int, help='size of base level') - aa('--maxtrain', default=0, type=int, - help='maximum number of training points (0 to set automatically)') - 
aa('--indexfile', default='', help='file to read or write index from') - aa('--add_bs', default=100000, type=int, - help='add elements index by batches of this size') - aa('--add_splits', default=1, type=int, - help="Do adds in this many splits (otherwise risk of OOM for large datasets)") - aa('--stop_at_split', default=-1, type=int, - help="stop at this split (for debugging)") - - aa('--no_precomputed_tables', action='store_true', default=False, - help='disable precomputed tables (uses less memory)') - aa('--clustering_niter', default=-1, type=int, - help='number of clustering iterations (-1 = leave default)') - aa('--two_level_clustering', action="store_true", default=False, - help='perform a 2-level tree clustering') - aa('--train_on_gpu', default=False, action='store_true', - help='do training on GPU') - aa('--quantizer_efConstruction', default=-1, type=int, - help="override the efClustering of the quantizer") - aa('--quantizer_add_efSearch', default=-1, type=int, - help="override the efSearch of the quantizer at add time") - aa('--buildthreads', default=-1, type=int, - help='nb of threads to use at build time') - - group = parser.add_argument_group('searching') - - aa('--k', default=10, type=int, help='nb of nearest neighbors') - aa('--radius', default=96237, type=float, help='radius for range search') - aa('--inter', default=True, action='store_true', - help='use intersection measure instead of 1-recall as metric') - aa('--searchthreads', default=-1, type=int, - help='nb of threads to use at search time') - aa('--searchparams', nargs='+', default=['autotune'], - help="search parameters to use (can be autotune or a list of params)") - aa('--n_autotune', default=500, type=int, - help="max nb of autotune experiments") - aa('--autotune_max', default=[], nargs='*', - help='set max value for autotune variables format "var:val" (exclusive)') - aa('--autotune_range', default=[], nargs='*', - help='set complete autotune range, format "var:val1,val2,..."') - 
aa('--min_test_duration', default=3.0, type=float, - help='run test at least for so long to avoid jitter') - aa('--parallel_mode', default=-1, type=int, - help="set search-time parallel mode for IVF indexes") - - group = parser.add_argument_group('computation options') - aa("--maxRAM", default=-1, type=int, help="set max RSS in GB (avoid OOM crash)") - - - args = parser.parse_args() - - print("args=", args) - - if args.basedir: - print("setting datasets basedir to", args.basedir) - benchmark.datasets.BASEDIR - benchmark.datasets.BASEDIR = args.basedir - - if args.maxRAM > 0: - print("setting max RSS to", args.maxRAM, "GiB") - resource.setrlimit( - resource.RLIMIT_DATA, (args.maxRAM * 1024 ** 3, resource.RLIM_INFINITY) - ) - - os.system('echo -n "nb processors "; ' - 'cat /proc/cpuinfo | grep ^processor | wc -l; ' - 'cat /proc/cpuinfo | grep ^"model name" | tail -1') - - ds = DATASETS[args.dataset]() - print(ds) - - nq, d = ds.nq, ds.d - nb, d = ds.nq, ds.d - - if args.prepare: - print("downloading dataset...") - ds.prepare() - print("dataset ready") - - if not (args.build or args.search): - return - - if args.pairwise_quantization: - if os.path.exists(args.pairwise_quantization): - print("loading pairwise quantization matrix", args.pairwise_quantization) - C = np.load(args.pairwise_quantization) - else: - print("training pairwise quantization") - xq_train = ds.get_query_train() - G = xq_train.T @ xq_train - C = np.linalg.cholesky(G).T - print("store matrix in", args.pairwise_quantization) - np.save(args.pairwise_quantization, C) - # Cq = np.linalg.inv(C.T) - # xb_pw = np.ascontiguousarray((C @ xb.T).T) - # xq_pw = np.ascontiguousarray((Cq @ xq.T).T) - ds = DatasetWrapInPairwiseQuantization(ds, C) - - if args.build: - print("build index, key=", args.indexkey) - index = build_index(args, ds) - else: - print("reading", args.indexfile) - index = faiss.read_index(args.indexfile) - - index_ivf, vec_transform = unwind_index_ivf(index) - if vec_transform is None: - 
vec_transform = lambda x: x - - if index_ivf is not None: - print("imbalance_factor=", index_ivf.invlists.imbalance_factor()) - - if args.no_precomputed_tables: - if isinstance(index_ivf, faiss.IndexIVFPQ): - print("disabling precomputed table") - index_ivf.use_precomputed_table = -1 - index_ivf.precomputed_table.clear() - - if args.indexfile: - print("index size on disk: ", os.stat(args.indexfile).st_size) - - print("current RSS:", faiss.get_mem_usage_kb() * 1024) - - precomputed_table_size = 0 - if hasattr(index_ivf, 'precomputed_table'): - precomputed_table_size = index_ivf.precomputed_table.size() * 4 - - print("precomputed tables size:", precomputed_table_size) - - if args.search: - - if args.searchthreads == -1: - print("Search threads:", faiss.omp_get_max_threads()) - else: - print("Setting nb of threads to", args.searchthreads) - faiss.omp_set_num_threads(args.searchthreads) - - if args.parallel_mode != -1: - print("setting IVF parallel mode to", args.parallel_mode) - index_ivf.parallel_mode - index_ivf.parallel_mode = args.parallel_mode - - if args.searchparams == ["autotune"]: - run_experiments_autotune(ds, index, args) - else: - run_experiments_searchparams(ds, index, args) - - -if __name__ == "__main__": - main() diff --git a/track1_baseline_faiss/parse_results.py b/track1_baseline_faiss/parse_results.py deleted file mode 100644 index 48e3411ac..000000000 --- a/track1_baseline_faiss/parse_results.py +++ /dev/null @@ -1,99 +0,0 @@ -""" -Parse log files from baseline_faiss.py - -""" -import os -import numpy as np - - - -def parse_result_file(fname): - # print fname - st = 0 - res = [] - keys = [] - stats = {} - stats['run_version'] = fname[-8] - indexkey = None - for l in open(fname): - if l.startswith("srun:"): - # looks like a crash... 
- if indexkey is None: - raise RuntimeError("instant crash") - break - elif st == 0: - if l.startswith("dataset in dimension"): - fi = l.split() - stats["d"] = int(fi[3][:-1]) - stats["nq"] = int(fi[9]) - stats["nb"] = int(fi[11]) - stats["nt"] = int(fi[13]) - if l.startswith('index size on disk:'): - stats['index_size'] = int(l.split()[-1]) - if l.startswith('current RSS:'): - stats['RSS'] = int(l.split()[-1]) - if l.startswith('precomputed tables size:'): - stats['tables_size'] = int(l.split()[-1]) - if l.startswith('Setting nb of threads to'): - stats['n_threads'] = int(l.split()[-1]) - if l.startswith(' add in'): - stats['add_time'] = float(l.split()[-2]) - if l.startswith('args:'): - args = eval(l[l.find(' '):]) - indexkey = args.indexkey - if l.startswith('build index, key='): - indexkey = l.split()[-1] - elif "time(ms/q)" in l: - # result header - if 'R@1 R@10 R@100' in l: - stats["measure"] = "recall" - stats["ranks"] = [1, 10, 100] - elif 'I@1 I@10 I@100' in l: - stats["measure"] = "inter" - stats["ranks"] = [1, 10, 100] - elif 'inter@' in l: - stats["measure"] = "inter" - fi = l.split() - if fi[1] == "inter@": - rank = int(fi[2]) - else: - rank = int(fi[1][len("inter@"):]) - stats["ranks"] = [rank] - elif 'AP' in l: - stats["measure"] = "average_precision" - else: - assert False - st = 1 - elif 'index size on disk:' in l: - stats["index_size"] = int(l.split()[-1]) - elif st == 1: - st = 2 - elif st == 2: - fi = l.split() - if l[0] == " ": - # means there are 0 parameters - fi = [""] + fi - keys.append(fi[0]) - if len(fi[1:]) > 0: - res.append([float(x) for x in fi[1:]]) - return indexkey, np.array(res), keys, stats - - -def find_latest_version(fname): - """ all log files are called - XX.a.log - XX.b.log - - Where XX is the experiment id and a, b... are versions. - The version is used when the same experiment needs to be - redone because it failed. 
This function returns the latest version - """ - assert fname.endswith(".log") - pref = fname[:-5] - lv = "" - for suf in "abcdefghijklmnopqrs": - fname = pref + suf + '.log' - if os.path.exists(fname): - lv = fname - assert lv - return lv \ No newline at end of file diff --git a/track1_baseline_faiss/plots/bigann-1B.png b/track1_baseline_faiss/plots/bigann-1B.png deleted file mode 100644 index 7a1d4a5b7..000000000 Binary files a/track1_baseline_faiss/plots/bigann-1B.png and /dev/null differ diff --git a/track1_baseline_faiss/plots/deep-1B.png b/track1_baseline_faiss/plots/deep-1B.png deleted file mode 100644 index 0c6bfc32e..000000000 Binary files a/track1_baseline_faiss/plots/deep-1B.png and /dev/null differ diff --git a/track1_baseline_faiss/plots/msspacev-1B.png b/track1_baseline_faiss/plots/msspacev-1B.png deleted file mode 100644 index a8f0c5fda..000000000 Binary files a/track1_baseline_faiss/plots/msspacev-1B.png and /dev/null differ diff --git a/track1_baseline_faiss/plots/msturing-1B.png b/track1_baseline_faiss/plots/msturing-1B.png deleted file mode 100644 index 2363edcd2..000000000 Binary files a/track1_baseline_faiss/plots/msturing-1B.png and /dev/null differ diff --git a/track1_baseline_faiss/plots/ssnpp-1B.png b/track1_baseline_faiss/plots/ssnpp-1B.png deleted file mode 100644 index 96e1b9720..000000000 Binary files a/track1_baseline_faiss/plots/ssnpp-1B.png and /dev/null differ diff --git a/track1_baseline_faiss/plots/text2image-1B.png b/track1_baseline_faiss/plots/text2image-1B.png deleted file mode 100644 index 5f7b9b302..000000000 Binary files a/track1_baseline_faiss/plots/text2image-1B.png and /dev/null differ diff --git a/track1_baseline_faiss/run_baselines.bash b/track1_baseline_faiss/run_baselines.bash deleted file mode 100644 index 62901423f..000000000 --- a/track1_baseline_faiss/run_baselines.bash +++ /dev/null @@ -1,530 +0,0 @@ -set -e - -export PYTHONPATH=. 
- - - - -function run_on () { - local sbatch_opt="$1" - shift - local name=$1 - shift - local torun=" $@ " - - if [ -e slurm_scripts/$name.sh ]; then - echo "script" slurm_scripts/$name.sh exists - exit 1 - fi - - echo -n $name " " - - echo $@ > slurm_scripts/$name.sh - - sbatch $sbatch_opt \ - -J $name -o logs/$name.log \ - --wrap "bash slurm_scripts/$name.sh" - -} - - -function run_on_1gpu () { - run_on "--gres=gpu:1 --ntasks=1 --time=30:00:00 --cpus-per-task=20 - --partition=devlab --mem=64g --nodes=1 " "$@" -} - -function run_on_1gpu_learnlab () { - run_on "--gres=gpu:1 --ntasks=1 --time=30:00:00 --cpus-per-task=20 - --partition=learnlab --mem=64g --nodes=1 " "$@" -} -function run_on_half_machine () { - run_on "--gres=gpu:1 --ntasks=1 --time=30:00:00 --cpus-per-task=40 - --partition=learnlab --mem=256g --nodes=1 " "$@" -} - -function run_on_2gpu_ram256 () { - run_on "--gres=gpu:2 --ntasks=1 --time=30:00:00 --cpus-per-task=20 - --partition=learnlab --mem=256g --nodes=1 " "$@" -} - - - -############################################################## -# Small scale experiments to evaluate effect of 2-level clustering -############################################################## - -# compare 2-level 65k clustering index and regular one - -basedir=data/track1_baseline_faiss - - -if false; then - -dsname=bigann-10M - - -run_on_1gpu $dsname.IVF65k_HNSW.a \ - python -u track1_baseline_faiss/baseline_faiss.py \ - --dataset $dsname --indexfile $basedir/$dsname.faissindex \ - --indexkey PCAR64,IVF65536_HNSW32,Flat --maxtrain $((65536 * 50)) \ - --search --train_on_gpu - - -run_on_1gpu $dsname.IVF65k_2level_HNSW.b \ - python -u track1_baseline_faiss/baseline_faiss.py \ - --dataset $dsname --indexfile $basedir/$dsname.IVF65k_2level_HNSW.faissindex \ - --indexkey PCAR64,IVF65536_HNSW32,Flat --maxtrain $((65536 * 50)) \ - --two_level_clustering \ - --search - - - - -# for efC in 50 100 200; do - -for efC in 400 800; do - -run_on_1gpu $dsname.IVF65k_HNSW_efC$efC.b \ - python 
-u track1_baseline_faiss/baseline_faiss.py \ - --dataset $dsname --indexfile $basedir/$dsname.IVF65k_HNSW_efC$efC.faissindex \ - --indexkey PCAR64,IVF65536_HNSW32,Flat --maxtrain $((65536 * 50)) \ - --quantizer_efConstruction $efC \ - --build --search --train_on_gpu - -done - - - -# for efS in 20 40 80; do -for efS in 160 320; do - -name=$dsname.IVF65k_2level_HNSW_efC200_efS$efS - -run_on_1gpu $name.a \ - python -u track1_baseline_faiss/baseline_faiss.py \ - --dataset $dsname --indexfile $basedir/$name.faissindex \ - --indexkey PCAR64,IVF65536_HNSW32,Flat --maxtrain $((65536 * 50)) \ - --quantizer_efConstruction 200 \ - --quantizer_add_efSearch $efS \ - --two_level_clustering \ - --build --search - -done - - - - -############################################################## -# Experiments on scale 100M -############################################################## - -# .a: build -# .c: eval w 32 threads - -# start with least problematic datasets (no IP search, no range search) -# msspace-1B may need to redo experiments because of ties in distance computations -for dsname in bigann-100M deep-100M msturing-100M msspacev-100M; do - - for nc in 256k 1M; do - - case $nc in - 1M) ncn=$((1<<20)) ;; - 256k) ncn=$((1<<18)) ;; - esac - - name=$dsname.IVF${nc}_2level_PQ32 - - run_on_half_machine $name.c \ - python -u track1_baseline_faiss/baseline_faiss.py \ - --dataset $dsname --indexfile $basedir/$name.faissindex \ - --indexkey OPQ32_128,IVF${ncn}_HNSW32,PQ32 \ - --maxtrain 100000000 \ - --quantizer_efConstruction 200 \ - --quantizer_add_efSearch 80 \ - --two_level_clustering \ - --search --searchthreads 32 \ - --maxRAM 256 - - name=$dsname.IVF${nc}_2level_PQ64x4fsr - - run_on_half_machine $name.c \ - python -u track1_baseline_faiss/baseline_faiss.py \ - --dataset $dsname --indexfile $basedir/$name.faissindex \ - --indexkey OPQ64_128,IVF${ncn}_HNSW32,PQ64x4fsr \ - --maxtrain 100000000 \ - --quantizer_efConstruction 200 \ - --quantizer_add_efSearch 80 \ - 
--two_level_clustering \ - --search --searchthreads 32 \ - --maxRAM 256 - - done - -done - - -############################################################## -# Experiments on scale 1B -############################################################## - -# .a: build -# .b: eval w 32 threads -# .c: redo bigann eval -# .d: with ssnpp, forgot to build... -# .f: redo t2i 64x4 (eval only) - -# start with least problematic datasets (no IP search, no range search) -# msspace-1B may need to redo experiments because of ties in distance computations - -# for dsname in bigann-1B deep-1B msturing-1B msspacev-1B; do -# for dsname in bigann-1B; do -# for dsname in ssnpp-1B; do -# for nc in 1M 4M; do - -fi - -for dsname in text2image-1B; do - - for nc in 1M; do - - case $nc in - 1M) ncn=$((1<<20)) ;; - 4M) ncn=$((1<<22)) ;; - esac - - if false ;then - - name=$dsname.IVF${nc}_2level_PQ32 - - run_on_half_machine $name.e \ - python -u track1_baseline_faiss/baseline_faiss.py \ - --dataset $dsname --indexfile $basedir/$name.faissindex \ - --indexkey OPQ32_128,IVF${ncn}_HNSW32,PQ32 \ - --maxtrain 100000000 \ - --quantizer_efConstruction 200 \ - --quantizer_add_efSearch 80 \ - --two_level_clustering \ - --build --search --searchthreads 32 \ - --maxRAM 256 - - fi - name=$dsname.IVF${nc}_2level_PQ64x4fsr - - run_on_half_machine $name.g \ - python -u track1_baseline_faiss/baseline_faiss.py \ - --dataset $dsname --indexfile $basedir/$name.faissindex \ - --indexkey OPQ64_128,IVF${ncn}_HNSW32,PQ64x4fsr \ - --maxtrain 100000000 \ - --quantizer_efConstruction 200 \ - --quantizer_add_efSearch 80 \ - --two_level_clustering \ - --search --searchthreads 32 \ - --maxRAM 256 --autotune_max nprobe:513 - - - done - -done - -if false; then - -# speed up construction - -dsname=ssnpp-1B -nc=1M -ncn=$((1<<20)) - -name=$dsname.IVF${nc}_2level_aefS40_PQ32 - -un_on_half_machine $name.d \ - python -u track1_baseline_faiss/baseline_faiss.py \ - --dataset $dsname --indexfile $basedir/$name.faissindex \ - --indexkey 
OPQ32_128,IVF${ncn}_HNSW32,PQ32 \ - --maxtrain 100000000 \ - --quantizer_efConstruction 200 \ - --quantizer_add_efSearch 40 \ - --add_splits 30 \ - --two_level_clustering \ - --build --search --searchthreads 32 \ - --maxRAM 256 - - -# find a way to not OOM during autotune - -function ssnpp_no_OOM () { - local key=$1 - shift - dsname=ssnpp-1B - nc=1M - ncn=$((1<<20)) - - name=$dsname.IVF${nc}_2level_PQ32.search.$key - - run_on_half_machine $name.a \ - python -u track1_baseline_faiss/baseline_faiss.py \ - --dataset $dsname --indexfile $basedir/$dsname.IVF${nc}_2level_PQ32.faissindex \ - --search --searchthreads 32 \ - --maxRAM 256 "$@" -} - -ssnpp_no_OOM radius75000 --radius 75000 -ssnpp_no_OOM radius80000 --radius 80000 -ssnpp_no_OOM radius60000 --radius 60000 -ssnpp_no_OOM maxNP1024 --autotune_max nprobe:1025 -ssnpp_no_OOM maxEFS256 --autotune_max quantizer_efSearch:257 - - - -############################################################## -# Experiments with 64 bytes per vector -############################################################## - -# .a: initial run and build -# .b: re-run to get more detailed search stats - - -for dsname in bigann-1B deep-1B msturing-1B msspacev-1B; do - nc=1M - ncn=$((1<<20)) - - name=$dsname.IVF${nc}_2level_PQ64 - - run_on_half_machine $name.b \ - python -u track1_baseline_faiss/baseline_faiss.py \ - --dataset $dsname --indexfile $basedir/$name.faissindex \ - --indexkey OPQ64_128,IVF${ncn}_HNSW32,PQ64 \ - --maxtrain 100000000 \ - --quantizer_efConstruction 200 \ - --quantizer_add_efSearch 80 \ - --two_level_clustering \ - --search --searchthreads 32 \ - --maxRAM 256 - - name=$dsname.IVF${nc}_2level_PQ128x4fsr - - run_on_half_machine $name.b \ - python -u track1_baseline_faiss/baseline_faiss.py \ - --dataset $dsname --indexfile $basedir/$name.faissindex \ - --indexkey OPQ128_128,IVF${ncn}_HNSW32,PQ128x4fsr \ - --maxtrain 100000000 \ - --quantizer_efConstruction 200 \ - --quantizer_add_efSearch 80 \ - --two_level_clustering \ - 
--search --searchthreads 32 \ - --maxRAM 256 - -done - - - -############################################################## -# 10M scale exeperiment for text2image -############################################################## - -dsname=text2image-10M - - -for nc in 16k 65k; do - - case $nc in - 16k) ncn=$((1<<14)) ;; - 65k) ncn=$((1<<16)) ;; - esac - - # baseline - key=IVF$nc - run_on_1gpu $dsname.$key.d \ - python -u track1_baseline_faiss/baseline_faiss.py \ - --dataset $dsname --indexfile $basedir/$dsname.$key.faissindex \ - --indexkey IVF${ncn},Flat --maxtrain $((ncn * 4 * 50)) \ - --build --search --train_on_gpu - - # loss due to 2-level - key=IVF${nc}_2level - run_on_1gpu $dsname.$key.d \ - python -u track1_baseline_faiss/baseline_faiss.py \ - --dataset $dsname --indexfile $basedir/$dsname.$key.faissindex \ - --indexkey IVF${ncn},Flat --maxtrain $((ncn * 4 * 50)) \ - --build --search --two_level_clustering - - # loss due to HNSW - key=IVF${nc}_HNSW - run_on_1gpu $dsname.$key.d \ - python -u track1_baseline_faiss/baseline_faiss.py \ - --dataset $dsname --indexfile $basedir/$dsname.$key.faissindex \ - --indexkey IVF${ncn}_HNSW32,Flat --maxtrain $((ncn * 4 * 50)) \ - --quantizer_efConstruction 200 \ - --quantizer_add_efSearch 80 \ - --build --search --train_on_gpu - - # loss due to 2-level + HNSW - key=IVF${nc}_2level_HNSW - run_on_1gpu $dsname.$key.d \ - python -u track1_baseline_faiss/baseline_faiss.py \ - --dataset $dsname --indexfile $basedir/$dsname.$key.faissindex \ - --indexkey IVF${ncn}_HNSW32,Flat --maxtrain $((ncn * 4 * 50)) \ - --quantizer_efConstruction 200 \ - --quantizer_add_efSearch 80 \ - --build --search --two_level_clustering - -done - -# evaluate various IVF codes - -ncn=16384 - - -key=IVF16k,SQ8 -run_on_1gpu_learnlab $dsname.$key.b \ - python -u track1_baseline_faiss/baseline_faiss.py \ - --dataset $dsname --indexfile $basedir/$dsname.$key.faissindex \ - --indexkey RR200,IVF16384,SQ8 --maxtrain $((ncn * 4 * 50)) \ - --build --search 
--train_on_gpu - -key=IVF16k,SQ8_nores -run_on_1gpu_learnlab $dsname.$key.b \ - python -u track1_baseline_faiss/baseline_faiss.py \ - --dataset $dsname --indexfile $basedir/$dsname.$key.faissindex \ - --indexkey RR200,IVF16384,SQ8 --maxtrain $((ncn * 4 * 50)) \ - --build --search --train_on_gpu --by_residual 0 - -key=IVF16k,SQ6 -run_on_1gpu_learnlab $dsname.$key.b \ - python -u track1_baseline_faiss/baseline_faiss.py \ - --dataset $dsname --indexfile $basedir/$dsname.$key.faissindex \ - --indexkey RR200,IVF16384,SQ6 --maxtrain $((ncn * 4 * 50)) \ - --build --search --train_on_gpu - -key=IVF16k,SQ6_nores -run_on_1gpu_learnlab $dsname.$key.b \ - python -u track1_baseline_faiss/baseline_faiss.py \ - --dataset $dsname --indexfile $basedir/$dsname.$key.faissindex \ - --indexkey RR200,IVF16384,SQ6 --maxtrain $((ncn * 4 * 50)) \ - --build --search --train_on_gpu --by_residual 0 - - -key=IVF16k,SQ8_PQ32 -run_on_1gpu_learnlab $dsname.$key.a \ - python -u track1_baseline_faiss/baseline_faiss.py \ - --dataset $dsname --indexfile $basedir/$dsname.$key.faissindex \ - --indexkey OPQ32_128,IVF16384,PQ32 --maxtrain $((ncn * 4 * 50)) \ - --build --search --train_on_gpu - -key=IVF16k,SQ8_PQ32_nores -run_on_1gpu_learnlab $dsname.$key.a \ - python -u track1_baseline_faiss/baseline_faiss.py \ - --dataset $dsname --indexfile $basedir/$dsname.$key.faissindex \ - --indexkey OPQ32_128,IVF16384,PQ32 --maxtrain $((ncn * 4 * 50)) \ - --build --search --train_on_gpu --by_residual 0 - - -key=IVF16k,SQ4 -run_on_1gpu_learnlab $dsname.$key.b \ - python -u track1_baseline_faiss/baseline_faiss.py \ - --dataset $dsname --indexfile $basedir/$dsname.$key.faissindex \ - --indexkey RR200,IVF16384,SQ4 --maxtrain $((ncn * 4 * 50)) \ - --build --search --train_on_gpu - -key=IVF16k,SQ4_PCAR100 -run_on_1gpu_learnlab $dsname.$key.b \ - python -u track1_baseline_faiss/baseline_faiss.py \ - --dataset $dsname --indexfile $basedir/$dsname.$key.faissindex \ - --indexkey PCAR100,IVF16384,SQ4 --maxtrain $((ncn * 4 * 
50)) \ - --build --search --train_on_gpu - -key=IVF16k,RR192_PQ32 -run_on_1gpu_learnlab $dsname.$key.b \ - python -u track1_baseline_faiss/baseline_faiss.py \ - --dataset $dsname --indexfile $basedir/$dsname.$key.faissindex \ - --indexkey RR192,IVF16384,PQ32 --maxtrain $((ncn * 4 * 50)) \ - --build --search --train_on_gpu - -key=IVF16k,RR192_PQ32x12 -run_on_1gpu_learnlab $dsname.$key.b \ - python -u track1_baseline_faiss/baseline_faiss.py \ - --dataset $dsname --indexfile $basedir/$dsname.$key.faissindex \ - --indexkey RR192,IVF16384,PQ32x12 --maxtrain $((ncn * 4 * 50)) \ - --build --search --train_on_gpu - - -dsname=text2image-10M - -key=IVF16k,PQ48 -run_on_1gpu $dsname.$key.c \ - python -u track1_baseline_faiss/baseline_faiss.py \ - --dataset $dsname --indexfile $basedir/$dsname.$key.faissindex \ - --indexkey OPQ48_192,IVF16384,PQ48 --maxtrain $((65536 * 50)) \ - --search --train_on_gpu - -key=IVF16k,PQ64 -run_on_1gpu $dsname.$key.c \ - python -u track1_baseline_faiss/baseline_faiss.py \ - --dataset $dsname --indexfile $basedir/$dsname.$key.faissindex \ - --indexkey OPQ64_192,IVF16384,PQ64 --maxtrain $((65536 * 50)) \ - --search --train_on_gpu - - -dsname=text2image-10M -key=IVF16k,PQ48 -run_on_1gpu $dsname.$key.c \ - python -u track1_baseline_faiss/baseline_faiss.py \ - --dataset $dsname --indexfile $basedir/$dsname.$key.faissindex \ - --indexkey OPQ48_192,IVF16384,PQ48 --maxtrain $((65536 * 50)) \ - --search --train_on_gpu - - - -## try out additive quants - - -export PYTHONPATH=/private/home/matthijs/faiss_versions/faiss_add_quant_search/build/faiss/python/build/lib:. 
-dsname=text2image-10M -for key in IVF16384,RQ32x8_Nfloat IVF16384,RQ31x8_Nqint8 IVF16384,LSQ32x8_Nfloat IVF16384,LSQ31x8_Nqint8 ; do -run_on_1gpu $dsname.$key.g \ - python -u track1_baseline_faiss/baseline_faiss.py \ - --dataset $dsname --indexfile $basedir/$dsname.$key.faissindex \ - --indexkey $key --maxtrain $((65536 * 50)) \ - --search --build # --train_on_gpu - -done - - -############################################################## -# GPU based search (T3) -############################################################## - -basedir=data/track3_baseline_faiss -dsname=deep-1B - -#.a: run with a too tight limit in RAM -#.b: increased RAM - -key=IVF262k,PQ8 -run_on_2gpu_ram256 T3.$dsname.$key.b \ - python -u track3_baseline_faiss/gpu_baseline_faiss.py \ - --maxRAM 256 \ - --dataset $dsname --indexkey IVF$((1<<18)),SQ8 \ - --build \ - --searchparams nprobe={1,4,16,64,256,1024} \ - --train_on_gpu --quantizer_on_gpu_add \ - --indexfile $basedir/$dsname.$key.faissindex \ - --add_splits 30 \ - --search \ - --parallel_mode 3 --quantizer_on_gpu_search - - -key=IVF1M,PQ8 -run_on_2gpu_ram256 T3.$dsname.$key.b \ - python -u track3_baseline_faiss/gpu_baseline_faiss.py \ - --maxRAM 256 \ - --dataset $dsname --indexkey IVF$((1<<20)),SQ8 \ - --build \ - --searchparams nprobe={1,4,16,64,256,1024} \ - --train_on_gpu --quantizer_on_gpu_add \ - --indexfile $basedir/$dsname.$key.faissindex \ - --add_splits 30 \ - --search \ - --parallel_mode 3 --quantizer_on_gpu_search - - -fi \ No newline at end of file diff --git a/track3_baseline_faiss/README.md b/track3_baseline_faiss/README.md deleted file mode 100644 index 903e6b9fb..000000000 --- a/track3_baseline_faiss/README.md +++ /dev/null @@ -1,73 +0,0 @@ -# Running the Faiss GPU baseline - -The script here is based on the T1 baseline, so please take a look at [the Track 1 baseline](../track1_baseline_faiss/README.md) first. 
- - ## Installing software - -See [this doc](../track1_baseline_faiss/README.md#installing-software) but instead of installing faiss-cpu, use: - -``` -conda install -c pytorch faiss-gpu cudatoolkit=10.2 -``` - -## How to use the GPU - -This script focuses on exploiting the GPU for coarse quantization. -Therefore, it is suitable for large codebooks. - -The GPU can be used in the following phases: - -- training: `--train_on_gpu` will move the training of the coarse quantizer to GPU - -- vector adding to the index: `--quantizer_on_gpu_add` will do the adding on GPU - -- search: `--parallel_mode 3 --quantizer_on_gpu_search` will do coarse quantization on GPU at search time. - -## Building the index and searching - -The hardware environment is: 1 GPU on a machine with 768G RAM (practically unlimited). -Therefore, the approach is to do the coarse quantization on GPU and store the IVF index in RAM with mild compression (PQ8). -This means that to keep the GPU busy the number of centroids should be as large as possible. -We use 1M in the example below. -The GPU uses brute force computations to find the nearest centroids. - -### 100M-scale - -The following command runs the index construction and evaluates the search performance: - -```bash -python track3_baseline_faiss/gpu_baseline_faiss.py --dataset deep-100M \ - --indexkey IVF65536,SQ8 \ - --train_on_gpu \ - --build --quantizer_on_gpu_add --add_splits 30 \ - --search \ - --searchparams nprobe={1,4,16,64,256} \ - --parallel_mode 3 --quantizer_on_gpu_search -``` - -Example logs [without GPU](https://gist.github.com/mdouze/9e000be47c499f79aaec0166365ef654) and [with GPU](https://gist.github.com/mdouze/cd14c802b924299aa2a92db6e05df857) at search time. 
- - -### 1B-scale - -```bash -python track3_baseline_faiss/gpu_baseline_faiss.py --dataset deep-1B \ - --indexkey IVF$((1<<18)),SQ8 \ - --train_on_gpu \ - --build --quantizer_on_gpu_add --add_splits 30 \ - --search \ - --searchparams nprobe={1,4,16,64,256} \ - --parallel_mode 3 --quantizer_on_gpu_search -``` - - -For the SSNPP dataset, please use `--parallel_mode 2` instead. - - -### Results - -Similar to the track 1 results, we can plot the GPU search results in a plot of recall@10 vs. QPS. - -![](plots/T3_deep-1B.png) - -Caveat: here the GPU uses 20 CPU threads vs. 32 for the CPU, and the search is actually performed on 2 GPUs. diff --git a/track3_baseline_faiss/gpu_baseline_faiss.py b/track3_baseline_faiss/gpu_baseline_faiss.py deleted file mode 100644 index a3fc2d1e8..000000000 --- a/track3_baseline_faiss/gpu_baseline_faiss.py +++ /dev/null @@ -1,574 +0,0 @@ -import os -import sys -import time -import pdb -import gc -import numpy as np -import faiss -import argparse -import resource -import threading -from multiprocessing.pool import ThreadPool - -import benchmark.datasets -from benchmark.datasets import DATASETS -from benchmark.plotting import eval_range_search - - - -def unwind_index_ivf(index): - if isinstance(index, faiss.IndexPreTransform): - assert index.chain.size() == 1 - vt = index.chain.at(0) - index_ivf, vt2 = unwind_index_ivf(faiss.downcast_index(index.index)) - assert vt2 is None - return index_ivf, vt - if hasattr(faiss, "IndexRefine") and isinstance(index, faiss.IndexRefine): - return unwind_index_ivf(faiss.downcast_index(index.base_index)) - if isinstance(index, faiss.IndexIVF): - return index, None - else: - return None, None - -def rate_limited_iter(l): - 'a thread pre-processes the next element' - pool = ThreadPool(1) - res = None - - def next_or_None(): - try: - return next(l) - except StopIteration: - return None - - while True: - res_next = pool.apply_async(next_or_None) - if res is not None: - res = res.get() - if res is None: - return - 
yield res - res = res_next - - -def build_index(args, ds): - nq, d = ds.nq, ds.d - nb, d = ds.nq, ds.d - - if args.buildthreads == -1: - print("Build-time number of threads:", faiss.omp_get_max_threads()) - else: - print("Set build-time number of threads:", args.buildthreads) - faiss.omp_set_num_threads(args.buildthreads) - - metric_type = ( - faiss.METRIC_L2 if ds.distance() == "euclidean" else - faiss.METRIC_INNER_PRODUCT if ds.distance() in ("ip", "angular") else - 1/0 - ) - index = faiss.index_factory(d, args.indexkey, metric_type) - - index_ivf, vec_transform = unwind_index_ivf(index) - if vec_transform is None: - vec_transform = lambda x: x - else: - vec_transform = faiss.downcast_VectorTransform(vec_transform) - - if args.by_residual != -1: - by_residual = args.by_residual == 1 - print("setting by_residual = ", by_residual) - index_ivf.by_residual # check if field exists - index_ivf.by_residual = by_residual - - if index_ivf: - print("Update add-time parameters") - # adjust default parameters used at add time for quantizers - # because otherwise the assignment is inaccurate - quantizer = faiss.downcast_index(index_ivf.quantizer) - if isinstance(quantizer, faiss.IndexRefine): - print(" update quantizer k_factor=", quantizer.k_factor, end=" -> ") - quantizer.k_factor = 32 if index_ivf.nlist < 1e6 else 64 - print(quantizer.k_factor) - base_index = faiss.downcast_index(quantizer.base_index) - if isinstance(base_index, faiss.IndexIVF): - print(" update quantizer nprobe=", base_index.nprobe, end=" -> ") - base_index.nprobe = ( - 16 if base_index.nlist < 1e5 else - 32 if base_index.nlist < 4e6 else - 64) - print(base_index.nprobe) - - index.verbose = True - if index_ivf: - index_ivf.verbose = True - index_ivf.quantizer.verbose = True - index_ivf.cp.verbose = True - - - maxtrain = args.maxtrain - if maxtrain == 0: - if 'IMI' in args.indexkey: - maxtrain = int(256 * 2 ** (np.log2(index_ivf.nlist) / 2)) - elif index_ivf: - maxtrain = 50 * index_ivf.nlist - else: - # 
just guess... - maxtrain = 256 * 100 - maxtrain = max(maxtrain, 256 * 100) - print("setting maxtrain to %d" % maxtrain) - - # train on dataset - print(f"getting first {maxtrain} dataset vectors for training") - - xt2 = next(ds.get_dataset_iterator(bs=maxtrain)) - - print("train, size", xt2.shape) - assert np.all(np.isfinite(xt2)) - - t0 = time.time() - - if (isinstance(vec_transform, faiss.OPQMatrix) and - isinstance(index_ivf, faiss.IndexIVFPQFastScan)): - print(" Forcing OPQ training PQ to PQ4") - ref_pq = index_ivf.pq - training_pq = faiss.ProductQuantizer( - ref_pq.d, ref_pq.M, ref_pq.nbits - ) - vec_transform.pq - vec_transform.pq = training_pq - - if args.clustering_niter >= 0: - print(("setting nb of clustering iterations to %d" % - args.clustering_niter)) - index_ivf.cp.niter = args.clustering_niter - - train_index = None - if args.train_on_gpu: - print("add a training index on GPU") - train_index = faiss.index_cpu_to_all_gpus( - faiss.IndexFlatL2(index_ivf.d)) - index_ivf.clustering_index = train_index - - index.train(xt2) - print(" Total train time %.3f s" % (time.time() - t0)) - - if train_index is not None: - del train_index - index_ivf.clustering_index = None - gc.collect() - - print("adding") - - t0 = time.time() - - if not args.quantizer_on_gpu_add: - i0 = 0 - for xblock in ds.get_dataset_iterator(bs=args.add_bs): - i1 = i0 + len(xblock) - print(" adding %d:%d / %d [%.3f s, RSS %d kiB] " % ( - i0, i1, ds.nb, time.time() - t0, - faiss.get_mem_usage_kb())) - index.add(xblock) - i0 = i1 - elif True: - quantizer_gpu = faiss.index_cpu_to_all_gpus(index_ivf.quantizer) - - nsplit = args.add_splits - - def produce_batches(sno): - for xblock in ds.get_dataset_iterator(bs=args.add_bs, split=(nsplit, sno)): - _, assign = quantizer_gpu.search(xblock, 1) - yield xblock, assign.ravel() - - i0 = 0 - for sno in range(nsplit): - print(f"============== SPLIT {sno}/{nsplit}") - - stage2 = rate_limited_iter(produce_batches(sno)) - for xblock, assign in stage2: - i1 = i0 
+ len(xblock) - print(" adding %d:%d / %d [%.3f s, RSS %d kiB] " % ( - i0, i1, ds.nb, time.time() - t0, - faiss.get_mem_usage_kb())) - index.add_core( - len(xblock), - faiss.swig_ptr(xblock), - None, - faiss.swig_ptr(assign) - ) - i0 = i1 - del quantizer_gpu - gc.collect() - - - print(" add in %.3f s" % (time.time() - t0)) - if args.indexfile: - print("storing", args.indexfile) - faiss.write_index(index, args.indexfile) - - return index - - -def compute_inter(a, b): - nq, rank = a.shape - ninter = sum( - np.intersect1d(a[i, :rank], b[i, :rank]).size - for i in range(nq) - ) - return ninter / a.size - - - -def eval_setting_knn(index, xq, gt, k, inter, min_time): - nq = xq.shape[0] - gt_I, gt_D = gt - ivf_stats = faiss.cvar.indexIVF_stats - ivf_stats.reset() - nrun = 0 - - t0 = time.time() - while True: - D, I = index.search(xq, k) - nrun += 1 - t1 = time.time() - if t1 - t0 > min_time: - break - ms_per_query = ((t1 - t0) * 1000.0 / nq / nrun) - if inter: - rank = k - inter_measure = compute_inter(gt[:, :rank], I[:, :rank]) - print("%.4f" % inter_measure, end=' ') - else: - for rank in 1, 10, 100: - n_ok = (I[:, :rank] == gt[:, :1]).sum() - print("%.4f" % (n_ok / float(nq)), end=' ') - print(" %9.5f " % ms_per_query, end=' ') - - if ivf_stats.search_time == 0: - # happens for IVFPQFastScan where the stats are not logged by default - print("%12d %5.2f " % (ivf_stats.ndis / nrun, 0.0), end=' ') - else: - pc_quantizer = ivf_stats.quantization_time / ivf_stats.search_time * 100 - print("%12d %5.2f " % (ivf_stats.ndis / nrun, pc_quantizer), end=' ') - print(nrun) - - -def eval_setting_range(index, xq, gt, radius=0, inter=False, min_time=3.0, query_bs=-1): - nq = xq.shape[0] - gt_nres, gt_I, gt_D = gt - gt_lims = np.zeros(nq + 1, dtype=int) - gt_lims[1:] = np.cumsum(gt_nres) - ivf_stats = faiss.cvar.indexIVF_stats - ivf_stats.reset() - nrun = 0 - t0 = time.time() - while True: - lims, D, I = index.range_search(xq, radius) - nrun += 1 - t1 = time.time() - if t1 - t0 > 
min_time: - break - ms_per_query = ((t1 - t0) * 1000.0 / nq / nrun) - - ap = eval_range_search.compute_AP((gt_lims, gt_I, gt_D), (lims, I, D)) - print("%.4f" % ap, end=' ') - print(" %9.5f " % ms_per_query, end=' ') - - print("%12d %5d " % (ivf_stats.ndis / nrun, D.size), end=' ') - print(nrun) - - -class IndexQuantizerOnGPU: - """ run query quantization on GPU """ - - def __init__(self, index, search_bs): - self.search_bs = search_bs - index_ivf, vec_transform = unwind_index_ivf(index) - self.index_ivf = index_ivf - self.vec_transform = vec_transform - self.quantizer_gpu = faiss.index_cpu_to_all_gpus(self.index_ivf.quantizer) - - - def produce_batches(self, x, bs): - n = len(x) - nprobe = self.index_ivf.nprobe - ivf_stats = faiss.cvar.indexIVF_stats - for i0 in range(0, n, bs): - xblock = x[i0:i0 + bs] - t0 = time.time() - D, I = self.quantizer_gpu.search(xblock, nprobe) - ivf_stats.quantization_time += 1000 * (time.time() - t0) - yield i0, xblock, D, I - - - def search(self, x, k): - bs = self.search_bs - if self.vec_transform: - x = self.vec_transform(x) - nprobe = self.index_ivf.nprobe - n, d = x.shape - assert self.index_ivf.d == d - D = np.empty((n, k), dtype=np.float32) - I = np.empty((n, k), dtype=np.int64) - - sp = faiss.swig_ptr - stage2 = rate_limited_iter(self.produce_batches(x, bs)) - t0 = time.time() - for i0, xblock, Dc, Ic in stage2: - ni = len(xblock) - self.index_ivf.search_preassigned( - ni, faiss.swig_ptr(xblock), - k, sp(Ic), sp(Dc), - sp(D[i0:]), sp(I[i0:]), - False - ) - - return D, I - - def range_search(self, x, radius): - bs = self.search_bs - if self.vec_transform: - x = self.vec_transform(x) - nprobe = self.index_ivf.nprobe - n, d = x.shape - assert self.index_ivf.d == d - - sp = faiss.swig_ptr - rsp = faiss.rev_swig_ptr - stage2 = rate_limited_iter(self.produce_batches(x, bs)) - t0 = time.time() - all_res = [] - nres = 0 - for i0, xblock, Dc, Ic in stage2: - ni = len(xblock) - res = faiss.RangeSearchResult(ni) - - 
self.index_ivf.range_search_preassigned( - ni, faiss.swig_ptr(xblock), - radius, sp(Ic), sp(Dc), - res - ) - all_res.append((ni, res)) - lims = rsp(res.lims, ni + 1) - nres += lims[-1] - nres = int(nres) - lims = np.zeros(n + 1, int) - I = np.empty(nres, int) - D = np.empty(nres, 'float32') - - n0 = 0 - for ni, res in all_res: - lims_i = rsp(res.lims, ni + 1) - nd = int(lims_i[-1]) - Di = rsp(res.distances, nd) - Ii = rsp(res.labels, nd) - i0 = int(lims[n0]) - lims[n0: n0 + ni + 1] = lims_i + i0 - I[i0:i0 + nd] = Ii - D[i0:i0 + nd] = Di - n0 += ni - - return lims, D, I - - -def run_experiments_searchparams(ds, index, args): - k = args.k - - xq = ds.get_queries() - - nq = len(xq) - - ps = faiss.ParameterSpace() - ps.initialize(index) - - - # setup the Criterion object - if args.inter: - print("Optimize for intersection @ ", args.k) - header = ( - '%-40s inter@%3d time(ms/q) nb distances %%quantization #runs' % - ("parameters", args.k) - ) - else: - print("Optimize for 1-recall @ 1") - header = ( - '%-40s R@1 R@10 R@100 time(ms/q) nb distances %%quantization #runs' % - "parameters" - ) - - searchparams = args.searchparams - - print(f"Running evaluation on {len(searchparams)} searchparams") - print(header) - maxw = max(max(len(p) for p in searchparams), 40) - - if args.quantizer_on_gpu_search: - index_wrap = IndexQuantizerOnGPU(index, args.search_bs) - else: - index_wrap = index - - for params in searchparams: - ps.set_index_parameters(index, params) - - print(params.ljust(maxw), end=' ') - sys.stdout.flush() - - if ds.search_type() == "knn": - eval_setting_knn( - index_wrap, xq, ds.get_groundtruth(k=args.k), - k=args.k, inter=args.inter, min_time=args.min_test_duration - ) - else: - eval_setting_range( - index_wrap, xq, ds.get_groundtruth(), - radius=args.radius, inter=args.inter, - min_time=args.min_test_duration - ) - - - -def main(): - - parser = argparse.ArgumentParser() - - def aa(*args, **kwargs): - group.add_argument(*args, **kwargs) - - group = 
parser.add_argument_group('What to do') - aa('--build', default=False, action="store_true") - aa('--search', default=False, action="store_true") - aa('--prepare', default=False, action="store_true", - help="call prepare() to download the dataset before computing") - - group = parser.add_argument_group('dataset options') - aa('--dataset', choices=DATASETS.keys(), required=True) - aa('--basedir', help="override basedir for dataset") - - group = parser.add_argument_group('index consturction') - - aa('--indexkey', default='IVF1204,Flat', help='index_factory type') - aa('--by_residual', default=-1, type=int, - help="set if index should use residuals (default=unchanged)") - aa('--maxtrain', default=0, type=int, - help='maximum number of training points (0 to set automatically)') - aa('--indexfile', default='', help='file to read or write index from') - aa('--add_bs', default=100000, type=int, - help='add elements index by batches of this size') - aa('--no_precomputed_tables', action='store_true', default=False, - help='disable precomputed tables (uses less memory)') - aa('--clustering_niter', default=-1, type=int, - help='number of clustering iterations (-1 = leave default)') - aa('--train_on_gpu', default=False, action='store_true', - help='do training on GPU') - aa('--buildthreads', default=-1, type=int, - help='nb of threads to use at build time') - aa('--quantizer_on_gpu_add', action="store_true", default=False, - help="use GPU coarse quantizer at add time") - aa('--add_splits', default=1, type=int, - help="Do adds in this many splits (otherwise risk of OOM with GPU based adds)") - - group = parser.add_argument_group('searching') - - aa('--k', default=10, type=int, help='nb of nearest neighbors') - aa('--radius', default=96237, type=float, help='radius for range search') - aa('--inter', default=True, action='store_true', - help='use intersection measure instead of 1-recall as metric') - aa('--searchthreads', default=-1, type=int, - help='nb of threads to use at 
search time') - aa('--searchparams', nargs='+', default=['autotune'], - help="search parameters to use (can be autotune or a list of params)") - aa('--min_test_duration', default=3.0, type=float, - help='run test at least for so long to avoid jitter') - aa('--quantizer_on_gpu_search', action="store_true", default=False, - help="use GPU coarse quantizer at search time") - aa('--parallel_mode', default=-1, type=int, - help="set search-time parallel mode for IVF indexes") - aa('--search_bs', default=8192, type=int, - help='search time batch size (for GPU/CPU tiling)') - - group = parser.add_argument_group('computation options') - aa("--maxRAM", default=-1, type=int, help="set max RSS in GB (avoid OOM crash)") - - - args = parser.parse_args() - - if args.basedir: - print("setting datasets basedir to", args.basedir) - benchmark.datasets.BASEDIR - benchmark.datasets.BASEDIR = args.basedir - - if args.maxRAM > 0: - print("setting max RSS to", args.maxRAM, "GiB") - resource.setrlimit( - resource.RLIMIT_DATA, (args.maxRAM * 1024 ** 3, resource.RLIM_INFINITY) - ) - - os.system('echo -n "nb processors "; ' - 'cat /proc/cpuinfo | grep ^processor | wc -l; ' - 'cat /proc/cpuinfo | grep ^"model name" | tail -1') - - ds = DATASETS[args.dataset]() - print(ds) - - nq, d = ds.nq, ds.d - nb, d = ds.nq, ds.d - - if args.prepare: - print("downloading dataset...") - ds.prepare() - print("dataset ready") - - if not (args.build or args.search): - return - - if args.build: - print("build index, key=", args.indexkey) - index = build_index(args, ds) - else: - print("reading", args.indexfile) - index = faiss.read_index(args.indexfile) - - index_ivf, vec_transform = unwind_index_ivf(index) - if vec_transform is None: - vec_transform = lambda x: x - - if index_ivf is not None: - print("imbalance_factor=", index_ivf.invlists.imbalance_factor()) - - if args.no_precomputed_tables: - if isinstance(index_ivf, faiss.IndexIVFPQ): - print("disabling precomputed table") - index_ivf.use_precomputed_table 
= -1 - index_ivf.precomputed_table.clear() - - if args.indexfile: - print("index size on disk: ", os.stat(args.indexfile).st_size) - - print("current RSS:", faiss.get_mem_usage_kb() * 1024) - - precomputed_table_size = 0 - if hasattr(index_ivf, 'precomputed_table'): - precomputed_table_size = index_ivf.precomputed_table.size() * 4 - - print("precomputed tables size:", precomputed_table_size) - - if args.search: - - if args.searchthreads == -1: - print("Search threads:", faiss.omp_get_max_threads()) - else: - print("Setting nb of threads to", args.searchthreads) - faiss.omp_set_num_threads(args.searchthreads) - - if args.parallel_mode != -1: - print("setting IVF parallel mode to", args.parallel_mode) - index_ivf.parallel_mode - index_ivf.parallel_mode = args.parallel_mode - - if args.searchparams == ["autotune"]: - run_experiments_autotune(ds, index, args) - else: - run_experiments_searchparams(ds, index, args) - -if __name__ == "__main__": - main() \ No newline at end of file diff --git a/track3_baseline_faiss/plots/T3_deep-1B.png b/track3_baseline_faiss/plots/T3_deep-1B.png deleted file mode 100644 index d6902d6a0..000000000 Binary files a/track3_baseline_faiss/plots/T3_deep-1B.png and /dev/null differ