lancedb/python/python/tests/test_rerankers.py at main · zebin-code/lancedb

History

384 lines (336 loc) · 12.6 KB

Raw

100

101

102

103

104

105

106

107

108

109

110

111

112

113

114

115

116

117

118

119

120

121

122

123

124

125

126

127

128

129

130

131

132

133

134

135

136

137

138

139

140

141

142

143

144

145

146

147

148

149

150

151

152

153

154

155

156

157

158

159

160

161

162

163

164

165

166

167

168

169

170

171

172

173

174

175

176

177

178

179

180

181

182

183

184

185

186

187

188

189

190

191

192

193

194

195

196

197

198

199

200

201

202

203

204

205

206

207

208

209

210

211

212

213

214

215

216

217

218

219

220

221

222

223

224

225

226

227

228

229

230

231

232

233

234

235

236

237

238

239

240

241

242

243

244

245

246

247

248

249

250

251

252

253

254

255

256

257

258

259

260

261

262

263

264

265

266

267

268

269

270

271

272

273

274

275

276

277

278

279

280

281

282

283

284

285

286

287

288

289

290

291

292

293

294

295

296

297

298

299

300

301

302

303

304

305

306

307

308

309

310

311

312

313

314

315

316

317

318

319

320

321

322

323

324

325

326

327

328

329

330

331

332

333

334

335

336

337

338

339

340

341

342

343

344

345

346

347

348

349

350

351

352

353

354

355

356

357

358

359

360

361

362

363

364

365

366

367

368

369

370

371

372

373

374

375

376

377

378

379

380

381

382

383

384

import os

import random

import lancedb

import numpy as np

import pyarrow as pa

import pytest

from lancedb.conftest import MockTextEmbeddingFunction # noqa

from lancedb.embeddings import EmbeddingFunctionRegistry

from lancedb.pydantic import LanceModel, Vector

from lancedb.rerankers import (

LinearCombinationReranker,

RRFReranker,

CohereReranker,

ColbertReranker,

CrossEncoderReranker,

OpenaiReranker,

JinaReranker,

AnswerdotaiRerankers,

VoyageAIReranker,

)

from lancedb.table import LanceTable

# Every test in this module builds a full-text-search index on its table, so
# skip the whole module when `lancedb.fts` cannot be imported.

pytest.importorskip("lancedb.fts")

def get_test_table(tmp_path, use_tantivy):
    """Build the table shared by the reranker tests.

    Connects to a database at ``tmp_path``, creates ``my_table`` with two text
    columns (``text`` and ``meta``) that each feed their own vector column via
    the registered ``"test"`` embedding function, inserts one row per phrase,
    and creates an FTS index on ``text``.

    Args:
        tmp_path: Location handed to ``lancedb.connect``.
        use_tantivy: Forwarded to ``create_fts_index``.

    Returns:
        A ``(table, schema)`` tuple: the populated table and the ``LanceModel``
        subclass describing its rows.
    """
    db = lancedb.connect(tmp_path)

    # Two separate instances of the "test" embedding function: one per
    # (source column, vector column) pair.
    text_emb, meta_emb = (
        EmbeddingFunctionRegistry.get_instance().get("test")() for _ in range(2)
    )

    class MyTable(LanceModel):
        text: str = text_emb.SourceField()
        vector: Vector(text_emb.ndims()) = text_emb.VectorField()
        meta: str = meta_emb.SourceField()
        meta_vector: Vector(meta_emb.ndims()) = meta_emb.VectorField()

    table = LanceTable.create(db, "my_table", schema=MyTable)

    # A reasonably large corpus so that result ordering can be checked.
    phrases = [
        "great kid don't get cocky",
        "now that's a name I haven't heard in a long time",
        "if you strike me down I shall become more powerful than you imagine",
        "I find your lack of faith disturbing",
        "I've got a bad feeling about this",
        "never tell me the odds",
        "I am your father",
        "somebody has to save our skins",
        "New strategy R2 let the wookiee win",
        "Arrrrggghhhhhhh",
        "I see a mansard roof through the trees",
        "I see a salty message written in the eves",
        "the ground beneath my feet",
        "the hot garbage and concrete",
        "and now the tops of buildings",
        "everybody with a worried mind could never forgive the sight",
        "of wicked snakes inside a place you thought was dignified",
        "I don't wanna live like this",
        "but I don't wanna die",
        "The templars want control",
        "the brotherhood of assassins want freedom",
        "if only they could both see the world as it really is",
        "there would be peace",
        "but the war goes on",
        "altair's legacy was a warning",
        "Kratos had a son",
        "he was a god",
        "the god of war",
        "but his son was mortal",
        "there hasn't been a good battlefield game since 2142",
        "I wish they would make another one",
        "campains are not as good as they used to be",
        "Multiplayer and open world games have destroyed the single player experience",
        "Maybe the future is console games",
        "I don't know",
    ]

    # One row per phrase; ``meta`` is another phrase picked at random. The
    # vector columns are not supplied here.
    rows = [{"text": phrase, "meta": random.choice(phrases)} for phrase in phrases]
    table.add(rows)

    table.create_fts_index("text", use_tantivy=use_tantivy)

    return table, MyTable

def _run_test_reranker(reranker, table, query, query_vector, schema):
    """Exercise ``reranker`` through hybrid, vector, FTS and multi-vector search.

    Args:
        reranker: Reranker instance under test.
        table: Table to search; it must expose the ``vector`` and
            ``meta_vector`` columns and support FTS queries.
        query: Text query used by every search that takes text, including the
            multi-vector section.
        query_vector: Vector used by the explicit-vector searches. When
            ``None``, the ``vector`` value of the table's first row is used.
        schema: Model class passed to ``to_pydantic``.

    Raises:
        AssertionError: If any of the result-shape or ordering checks fail.
    """
    ascending_relevance_err = (
        "The _relevance_score column of the results returned by the reranker "
        "represents the relevance of the result to the query & should "
        "be descending."
    )

    # Hybrid search setting: explicit normalize="score" must give the same
    # results as leaving ``normalize`` unspecified.
    result1 = (
        table.search(query, query_type="hybrid", vector_column_name="vector")
        .rerank(normalize="score", reranker=reranker)
        .to_pydantic(schema)
    )
    result2 = (
        table.search(query, query_type="hybrid", vector_column_name="vector")
        .rerank(reranker=reranker)
        .to_pydantic(schema)
    )
    assert result1 == result2

    # Honour a caller-supplied vector; only fall back to the first stored
    # vector when none was given (previously the argument was always ignored).
    if query_vector is None:
        query_vector = table.to_pandas()["vector"][0]

    result = (
        table.search(query_type="hybrid", vector_column_name="vector")
        .vector(query_vector)
        .text(query)
        .limit(30)
        .rerank(reranker=reranker)
        .to_arrow()
    )
    assert len(result) == 30
    assert np.all(
        np.diff(result.column("_relevance_score").to_numpy()) <= 0
    ), ascending_relevance_err

    # Vector search setting
    result = (
        table.search(query, vector_column_name="vector")
        .rerank(reranker=reranker)
        .limit(30)
        .to_arrow()
    )
    assert len(result) == 30
    assert np.all(
        np.diff(result.column("_relevance_score").to_numpy()) <= 0
    ), ascending_relevance_err

    result_explicit = (
        table.search(query_vector, vector_column_name="vector")
        .rerank(reranker=reranker, query_string=query)
        .limit(30)
        .to_arrow()
    )
    assert len(result_explicit) == 30

    # A raw vector query without a reranking query string must be rejected.
    with pytest.raises(ValueError):
        table.search(query_vector, vector_column_name="vector").rerank(
            reranker=reranker
        ).limit(30).to_arrow()

    # FTS search setting
    result = (
        table.search(query, query_type="fts", vector_column_name="vector")
        .rerank(reranker=reranker)
        .limit(30)
        .to_arrow()
    )
    assert len(result) > 0
    assert np.all(
        np.diff(result.column("_relevance_score").to_numpy()) <= 0
    ), ascending_relevance_err

    # Empty FTS results. A separate name is used so that ``query`` keeps the
    # caller's value for the multi-vector checks below.
    empty_fts_query = "abcxyz" * 100
    result = (
        table.search(query_type="hybrid", vector_column_name="vector")
        .vector(query_vector)
        .text(empty_fts_query)
        .limit(30)
        .rerank(reranker=reranker)
        .to_arrow()
    )
    # The _relevance_score column must still be present and ordered.
    assert "_relevance_score" in result.column_names
    assert np.all(
        np.diff(result.column("_relevance_score").to_numpy()) <= 0
    ), ascending_relevance_err

    # Multi-vector search setting
    rs1 = table.search(query, vector_column_name="vector").limit(10).with_row_id(True)
    rs2 = (
        table.search(query, vector_column_name="meta_vector")
        .limit(10)
        .with_row_id(True)
    )
    result = reranker.rerank_multivector([rs1, rs2], query)
    assert len(result) == 20

    result_deduped = reranker.rerank_multivector(
        [rs1, rs2, rs1], query, deduplicate=True
    )
    assert len(result_deduped) <= 20

    # Passing materialized Arrow tables must match passing query builders.
    result_arrow = reranker.rerank_multivector([rs1.to_arrow(), rs2.to_arrow()], query)
    assert len(result) == 20 and result == result_arrow

def _run_test_hybrid_reranker(reranker, tmp_path, use_tantivy):
    """Run the shared hybrid-search checks for a result-merging reranker.

    Builds a fresh table via ``get_test_table`` and then checks the default
    reranker's normalization behaviour, the supplied ``reranker`` on an
    explicit vector + text hybrid query, rejection of conflicting query
    arguments, and the empty-FTS-result case.

    Args:
        reranker: Reranker instance passed to ``rerank``.
        tmp_path: Database location forwarded to ``get_test_table``.
        use_tantivy: FTS backend switch forwarded to ``get_test_table``.
    """
    table, schema = get_test_table(tmp_path, use_tantivy)
    hybrid = {"query_type": "hybrid", "vector_column_name": "vector"}
    descending_msg = (
        "The _relevance_score column of the results returned by the reranker "
        "represents the relevance of the result to the query & should "
        "be descending."
    )

    def check_descending(arrow_result):
        # Consecutive differences must never be positive.
        scores = arrow_result.column("_relevance_score").to_numpy()
        assert np.all(np.diff(scores) <= 0), descending_msg

    # The default reranker, with explicit score normalization ...
    score_normalized = (
        table.search("Our father who art in heaven", **hybrid)
        .rerank(normalize="score")
        .to_pydantic(schema)
    )
    # ... with rank normalization (executed, but its output is not compared) ...
    _ = (
        table.search("Our father who art in heaven.", **hybrid)
        .rerank(normalize="rank")
        .to_pydantic(schema)
    )
    # ... and with no explicit rerank() call at all.
    implicit_default = table.search(
        "Our father who art in heaven..", **hybrid
    ).to_pydantic(schema)
    # The first and third results are expected to match; presumably the
    # implicit default also normalizes by score -- confirm against rerank().
    assert score_normalized == implicit_default

    text_query = "Our father who art in heaven"
    first_vector = table.to_pandas()["vector"][0]
    reranked = (
        table.search(**hybrid)
        .vector(first_vector)
        .text(text_query)
        .limit(30)
        .rerank(reranker, normalize="score")
        .to_arrow()
    )
    assert len(reranked) == 30

    # Fail if both query and (vector or text) are provided
    with pytest.raises(ValueError):
        table.search(text_query, **hybrid).vector(first_vector).to_arrow()
    with pytest.raises(ValueError):
        table.search(text_query, **hybrid).text(text_query).to_arrow()

    check_descending(reranked)

    # Test with empty FTS results
    unmatched_text = "abcxyz" * 100
    reranked = (
        table.search(**hybrid)
        .vector(first_vector)
        .text(unmatched_text)
        .limit(30)
        .rerank(reranker=reranker)
        .to_arrow()
    )
    # The _relevance_score column must still be returned.
    assert "_relevance_score" in reranked.column_names
    check_descending(reranked)

@pytest.mark.parametrize("use_tantivy", [True, False])
def test_linear_combination(tmp_path, use_tantivy):
    """Check ``LinearCombinationReranker.merge_results`` and hybrid search.

    First merges two hand-built result tables and verifies the merged row
    count and column set, then runs the shared hybrid-search checks.
    """
    reranker = LinearCombinationReranker()

    # Row ids 1-4 appear in both inputs; 0 and 5 appear in only one of them.
    vector_hits = pa.Table.from_pydict(
        {
            "_rowid": [0, 1, 2, 3, 4],
            "_distance": [0.1, 0.2, 0.3, 0.4, 0.5],
            "_text": ["a", "b", "c", "d", "e"],
        }
    )
    fts_hits = pa.Table.from_pydict(
        {
            "_rowid": [1, 2, 3, 4, 5],
            "_score": [0.1, 0.2, 0.3, 0.4, 0.5],
            "_text": ["b", "c", "d", "e", "f"],
        }
    )

    merged = reranker.merge_results(vector_hits, fts_hits, 1.0)
    assert len(merged) == 6

    # (column name, whether it must be present in the merged table)
    expected_columns = (
        ("_rowid", True),
        ("_text", True),
        ("_distance", False),
        ("_score", False),
        ("_relevance_score", True),
    )
    for column, should_exist in expected_columns:
        assert (column in merged.column_names) is should_exist

    _run_test_hybrid_reranker(reranker, tmp_path, use_tantivy)

@pytest.mark.parametrize("use_tantivy", [True, False])
def test_rrf_reranker(tmp_path, use_tantivy):
    """Run the shared hybrid-search checks with a default ``RRFReranker``."""
    _run_test_hybrid_reranker(RRFReranker(), tmp_path, use_tantivy)

@pytest.mark.skipif(
    "COHERE_API_KEY" not in os.environ, reason="COHERE_API_KEY not set"
)
@pytest.mark.parametrize("use_tantivy", [True, False])
def test_cohere_reranker(tmp_path, use_tantivy):
    """Run the shared reranker checks with ``CohereReranker``.

    Skipped when ``COHERE_API_KEY`` is unset or ``cohere`` is not importable.
    """
    pytest.importorskip("cohere")
    cohere_reranker = CohereReranker()
    test_table, row_model = get_test_table(tmp_path, use_tantivy)
    _run_test_reranker(
        reranker=cohere_reranker,
        table=test_table,
        query="single player experience",
        query_vector=None,
        schema=row_model,
    )

@pytest.mark.parametrize("use_tantivy", [True, False])
def test_cross_encoder_reranker(tmp_path, use_tantivy):
    """Run the shared reranker checks with ``CrossEncoderReranker``.

    Skipped when ``sentence_transformers`` is not importable.
    """
    pytest.importorskip("sentence_transformers")
    cross_encoder = CrossEncoderReranker()
    test_table, row_model = get_test_table(tmp_path, use_tantivy)
    _run_test_reranker(
        reranker=cross_encoder,
        table=test_table,
        query="single player experience",
        query_vector=None,
        schema=row_model,
    )

@pytest.mark.parametrize("use_tantivy", [True, False])
def test_colbert_reranker(tmp_path, use_tantivy):
    """Run the shared reranker checks with ``ColbertReranker``.

    Skipped when the ``rerankers`` package is not importable.
    """
    pytest.importorskip("rerankers")
    colbert = ColbertReranker()
    test_table, row_model = get_test_table(tmp_path, use_tantivy)
    _run_test_reranker(
        reranker=colbert,
        table=test_table,
        query="single player experience",
        query_vector=None,
        schema=row_model,
    )

@pytest.mark.parametrize("use_tantivy", [True, False])
def test_answerdotai_reranker(tmp_path, use_tantivy):
    """Run the shared reranker checks with ``AnswerdotaiRerankers``.

    Skipped when the ``rerankers`` package is not importable.
    """
    pytest.importorskip("rerankers")
    answerdotai = AnswerdotaiRerankers()
    test_table, row_model = get_test_table(tmp_path, use_tantivy)
    _run_test_reranker(
        reranker=answerdotai,
        table=test_table,
        query="single player experience",
        query_vector=None,
        schema=row_model,
    )

@pytest.mark.skipif(
    "OPENAI_API_KEY" not in os.environ, reason="OPENAI_API_KEY not set"
)
@pytest.mark.parametrize("use_tantivy", [True, False])
def test_openai_reranker(tmp_path, use_tantivy):
    """Run the shared reranker checks with ``OpenaiReranker``.

    Skipped when ``OPENAI_API_KEY`` is unset or ``openai`` is not importable.
    """
    pytest.importorskip("openai")
    # The table is built before the reranker is constructed.
    test_table, row_model = get_test_table(tmp_path, use_tantivy)
    openai_reranker = OpenaiReranker()
    _run_test_reranker(
        reranker=openai_reranker,
        table=test_table,
        query="single player experience",
        query_vector=None,
        schema=row_model,
    )

@pytest.mark.skipif(
    "JINA_API_KEY" not in os.environ, reason="JINA_API_KEY not set"
)
@pytest.mark.parametrize("use_tantivy", [True, False])
def test_jina_reranker(tmp_path, use_tantivy):
    """Run the shared reranker checks with ``JinaReranker``.

    Skipped when ``JINA_API_KEY`` is unset or ``jina`` is not importable.
    """
    # NOTE(review): confirm that JinaReranker really needs the `jina` package;
    # if it does not, this guard skips the test unnecessarily.
    pytest.importorskip("jina")
    # The table is built before the reranker is constructed.
    test_table, row_model = get_test_table(tmp_path, use_tantivy)
    jina_reranker = JinaReranker()
    _run_test_reranker(
        reranker=jina_reranker,
        table=test_table,
        query="single player experience",
        query_vector=None,
        schema=row_model,
    )

@pytest.mark.skipif(
    "VOYAGE_API_KEY" not in os.environ, reason="VOYAGE_API_KEY not set"
)
@pytest.mark.parametrize("use_tantivy", [True, False])
def test_voyageai_reranker(tmp_path, use_tantivy):
    """Run the shared reranker checks with ``VoyageAIReranker`` (``rerank-2``).

    Skipped when ``VOYAGE_API_KEY`` is unset or ``voyageai`` is not importable.
    """
    pytest.importorskip("voyageai")
    voyage_reranker = VoyageAIReranker(model_name="rerank-2")
    test_table, row_model = get_test_table(tmp_path, use_tantivy)
    _run_test_reranker(
        reranker=voyage_reranker,
        table=test_table,
        query="single player experience",
        query_vector=None,
        schema=row_model,
    )

Provide feedback

Saved searches

Use saved searches to filter your results more quickly

FilesExpand file tree

test_rerankers.py

Latest commit

History

test_rerankers.py

File metadata and controls