@@ -93,12 +93,13 @@ jobs:
9393
9494 # Download pre-packaged Wikipedia-100K dataset from GitHub Release
9595 # Dataset: 100K Cohere Wikipedia embeddings (768-dim, float32, cosine distance)
96+ # Source: https://github.com/harsha-simhadri/big-ann-benchmarks
9697 - name: Download wikipedia-100K dataset
9798 env:
9899 GH_TOKEN: ${{ github.token }}
99100 run: |
100101 mkdir -p diskann_rust/target/tmp baseline/target/tmp
101- gh release download benchmark-data-v1 --repo ${{ github.repository }} --pattern 'wikipedia-100K.tar.gz' --dir .
102+ gh release download v1 --repo YuanyuanTian-hh/diskann-benchmark-data --pattern 'wikipedia-100K.tar.gz' --dir .
102103 tar xzf wikipedia-100K.tar.gz -C diskann_rust/target/tmp/
103104 cp -r diskann_rust/target/tmp/wikipedia_cohere baseline/target/tmp/
104105
@@ -203,12 +204,13 @@ jobs:
203204
204205 # Download pre-packaged OpenAI ArXiv 100K dataset from GitHub Release
205206 # Dataset: 100K OpenAI embeddings of ArXiv papers (1536-dim, float32, euclidean distance)
207+ # Source: https://github.com/harsha-simhadri/big-ann-benchmarks
206208 - name: Download openai-100K dataset
207209 env:
208210 GH_TOKEN: ${{ github.token }}
209211 run: |
210212 mkdir -p diskann_rust/target/tmp baseline/target/tmp
211- gh release download benchmark-data-v1 --repo ${{ github.repository }} --pattern 'openai-100K.tar.gz' --dir .
213+ gh release download v1 --repo YuanyuanTian-hh/diskann-benchmark-data --pattern 'openai-100K.tar.gz' --dir .
212214 tar xzf openai-100K.tar.gz -C diskann_rust/target/tmp/
213215 cp -r diskann_rust/target/tmp/OpenAIArXiv baseline/target/tmp/
214216
0 commit comments