Skip to content

Commit c1ac072

Browse files
Merge pull request #113 from javadr-forky/dev
feat(available_dataset): enable output redirection & fix typo
2 parents 82b88c7 + 332dd5f commit c1ac072

7 files changed

Lines changed: 9 additions & 9 deletions

File tree

README-PyPI.md

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -203,7 +203,7 @@ To see all available datasets:
203203
from rankify.dataset.dataset import Dataset
204204

205205
# Display available datasets
206-
Dataset.avaiable_dataset()
206+
Dataset.available_dataset()
207207
```
208208

209209
**BM25 Retriever**

README_zh.md

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -223,7 +223,7 @@ rm -rf ~/.cache/torch_extensions/*
223223
from rankify.dataset.dataset import Dataset
224224

225225
# 显示可用数据集
226-
Dataset.avaiable_dataset()
226+
Dataset.available_dataset()
227227
```
228228

229229

docs/docs/tutorials/datasets/benchmark_datasets.md

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -23,7 +23,7 @@ Rankify provides easy access to standard QA benchmark datasets.
2323
from rankify.dataset.dataset import Dataset
2424

2525
# List all available datasets
26-
Dataset.avaiable_dataset()
26+
Dataset.available_dataset()
2727

2828
# Load NQ with BM25 retrieval
2929
dataset = Dataset(

docs/docs/tutorials/retrieval/prebuilt_corpora.md

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -63,7 +63,7 @@ For benchmarking, Rankify provides pre-retrieved datasets on Hugging Face:
6363
from rankify.dataset.dataset import Dataset
6464

6565
# List available datasets
66-
Dataset.avaiable_dataset()
66+
Dataset.available_dataset()
6767

6868
# Download a pre-retrieved dataset
6969
dataset = Dataset(

examples/retrieved_dataset.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -2,7 +2,7 @@
22
os.environ["CUDA_VISIBLE_DEVICES"] = "0"
33
from rankify.dataset.dataset import Dataset ,Document, Context, Question,Answer
44
from rankify.metrics.metrics import Metrics
5-
#Dataset.avaiable_dataset()
5+
#Dataset.available_dataset()
66

77

88
datasets = ["web_questions-test"]#, "ChroniclingAmericaQA-test" , "ArchivialQA-test"]#["nq-dev", "nq-test" , "squad1-test", "trivia-dev", "trivia-test", "webq-test", "squad1-dev" ] #

rankify/dataset/dataset.py

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -657,7 +657,7 @@ def __getitem__(self,idx) -> Document:
657657

658658

659659
@staticmethod
660-
def avaiable_dataset() -> None:
660+
def available_dataset(file=None) -> None:
661661
"""
662662
Prints information about available datasets.
663663
@@ -666,7 +666,7 @@ def avaiable_dataset() -> None:
666666
Dataset.available_dataset()
667667
```
668668
"""
669-
get_datasets_info()
669+
get_datasets_info(file=file)
670670

671671

672672

rankify/utils/dataset/utils.py

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -2,7 +2,7 @@
22
import pandas as pd
33
from prettytable import PrettyTable
44

5-
def get_datasets_info():
5+
def get_datasets_info(file=None):
66
table = PrettyTable(['Retriever', 'Dataset', 'Original ext', 'Compressed','Desc','URL'])
77
for retriever, datasets in HF_PRE_DEFIND_DATASET.items():
88
for dataset_name, dataset_info in datasets.items():
@@ -17,4 +17,4 @@ def get_datasets_info():
1717
}
1818
table.add_row(flattened_entry.values())
1919

20-
print(table)
20+
print(table, file=file)

0 commit comments

Comments
 (0)