
Evaluate

Qrels

Bases: object

Qrels, or query relevance judgments, stores the ground truth for conducting evaluations.

The preferred way to create a Qrels instance is to convert a Python dictionary, as follows:

qrels_dict = {
    "q_1": {
        "d_1": 1,
        "d_2": 2,
    },
    "q_2": {
        "d_3": 2,
        "d_2": 1,
        "d_5": 3,
    },
}

qrels = Qrels(qrels_dict, name="MSMARCO")

qrels = Qrels()  # Creates an empty Qrels with no name
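
Once created, a Qrels can be converted back to plain Python structures for inspection or storage. A minimal sketch, continuing the qrels_dict example above and using the to_dict and to_dataframe methods documented below:

qrels = Qrels(qrels_dict, name="MSMARCO")

qrels_as_dict = qrels.to_dict()     # nested dict: {q_id: {doc_id: score}}
qrels_as_df = qrels.to_dataframe()  # DataFrame with columns: q_id, doc_id, score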
Source code in ranx/data_structures/qrels.py
class Qrels(object):
    """`Qrels`, or _query relevance judgments_, stores the ground truth for conducting evaluations.

    The preferred way to create a `Qrels` instance is to convert a Python dictionary, as follows:

    ```python
    qrels_dict = {
        "q_1": {
            "d_1": 1,
            "d_2": 2,
        },
        "q_2": {
            "d_3": 2,
            "d_2": 1,
            "d_5": 3,
        },
    }

    qrels = Qrels(qrels_dict, name="MSMARCO")

    qrels = Qrels()  # Creates an empty Qrels with no name
    ```
    """

    def __init__(self, qrels: Dict[str, Dict[str, int]] = None, name: str = None):
        if qrels is None:
            self.qrels = TypedDict.empty(
                key_type=types.unicode_type,
                value_type=types.DictType(types.unicode_type, types.int64),
            )
            self.sorted = False
        else:
            # Query IDs
            q_ids = list(qrels.keys())
            q_ids = TypedList(q_ids)

            # Doc IDs
            doc_ids = [list(doc.keys()) for doc in qrels.values()]
            max_len = max(len(y) for x in doc_ids for y in x)
            dtype = f"<U{max_len}"
            doc_ids = TypedList([np.array(x, dtype=dtype) for x in doc_ids])

            # Scores
            scores = [list(doc.values()) for doc in qrels.values()]
            scores = TypedList([np.array(x, dtype=int) for x in scores])

            self.qrels = create_and_sort(q_ids, doc_ids, scores)
            self.sorted = True

        self.name = name

    def keys(self):
        """Returns query ids. Used internally."""
        return self.qrels.keys()

    def add_score(self, q_id: str, doc_id: str, score: int):
        """Add a (doc_id, score) pair to a query (or, change its value if it already exists).

        Args:
            q_id (str): Query ID
            doc_id (str): Document ID
            score (int): Relevance score judgment
        """
        if self.qrels.get(q_id) is None:
            self.qrels[q_id] = TypedDict.empty(
                key_type=types.unicode_type,
                value_type=types.int64,
            )
        self.qrels[q_id][doc_id] = int(score)
        self.sorted = False

    def add(self, q_id: str, doc_ids: List[str], scores: List[int]):
        """Add a query and its relevant documents with the associated relevance score judgment.

        Args:
            q_id (str): Query ID
            doc_ids (List[str]): List of Document IDs
            scores (List[int]): List of relevance score judgments
        """
        self.add_multi([q_id], [doc_ids], [scores])

    def add_multi(
        self,
        q_ids: List[str],
        doc_ids: List[List[str]],
        scores: List[List[int]],
    ):
        """Add multiple queries at once.

        Args:
            q_ids (List[str]): List of Query IDs
            doc_ids (List[List[str]]): List of list of Document IDs
            scores (List[List[int]]): List of list of relevance score judgments
        """
        q_ids = TypedList(q_ids)
        doc_ids = TypedList([TypedList(x) for x in doc_ids])
        scores = TypedList([TypedList(map(int, x)) for x in scores])

        self.qrels = add_and_sort(self.qrels, q_ids, doc_ids, scores)
        self.sorted = True

    def set_relevance_level(self, rel_lvl: int = 1):
        """Sets relevance level."""
        self.qrels = _set_relevance_level(self.qrels, rel_lvl)

    def get_query_ids(self):
        """Returns query ids."""
        return list(self.qrels.keys())

    def get_doc_ids_and_scores(self):
        """Returns doc ids and relevance judgments."""
        return list(self.qrels.values())

    # Sort in place
    def sort(self):
        """Sort. Used internally."""
        self.qrels = sort_dict_by_key(self.qrels)
        self.qrels = sort_dict_of_dict_by_value(self.qrels)
        self.sorted = True

    def to_typed_list(self):
        """Convert Qrels to Numba Typed List. Used internally."""
        if not self.sorted:
            self.sort()
        return to_typed_list(self.qrels)

    def to_dict(self) -> Dict[str, Dict[str, int]]:
        """Convert Qrels to Python dictionary.

        Returns:
            Dict[str, Dict[str, int]]: Qrels as Python dictionary
        """
        d = defaultdict(dict)
        for q_id in self.keys():
            d[q_id] = dict(self[q_id])
        return d

    def to_dataframe(self) -> pd.DataFrame:
        """Convert Qrels to Pandas DataFrame with the following columns: `q_id`, `doc_id`, and `score`.

        Returns:
            pandas.DataFrame: Qrels as Pandas DataFrame.
        """
        data = {"q_id": [], "doc_id": [], "score": []}

        for q_id in self.qrels:
            for doc_id in self.qrels[q_id]:
                data["q_id"].append(q_id)
                data["doc_id"].append(doc_id)
                data["score"].append(self.qrels[q_id][doc_id])

        return pd.DataFrame.from_dict(data)

    def save(self, path: str = "qrels.json", kind: str = None) -> None:
        """Write `qrels` to `path` as JSON file, TREC qrels format, or Parquet file. File type is automatically inferred form the filename extension: ".json" -> "json", ".trec" -> "trec", ".txt" -> "trec", ".parq" -> "parquet", ".parquet" -> "parquet". Use the "kind" argument to override this behavior.

        Args:
            path (str, optional): Saving path. Defaults to "qrels.json".
            kind (str, optional): Kind of file to save, must be either "json", "trec", or "parquet". If None, it will be automatically inferred from the filename extension.
        """
        # Infer file extension -------------------------------------------------
        kind = get_file_kind(path, kind)

        # Save Qrels -----------------------------------------------------------
        if kind == "json":
            with open(path, "wb") as f:
                f.write(orjson.dumps(self.to_dict(), option=orjson.OPT_INDENT_2))
        elif kind == "parquet":
            self.to_dataframe().to_parquet(path, index=False)
        else:
            with open(path, "w") as f:
                for i, q_id in enumerate(self.qrels.keys()):
                    for j, doc_id in enumerate(self.qrels[q_id].keys()):
                        score = self.qrels[q_id][doc_id]
                        f.write(f"{q_id} 0 {doc_id} {score}")

                        if (
                            i != len(self.qrels.keys()) - 1
                            or j != len(self.qrels[q_id].keys()) - 1
                        ):
                            f.write("\n")

    @staticmethod
    def from_dict(d: Dict[str, Dict[str, int]]):
        """Convert a Python dictionary in form of {q_id: {doc_id: score}} to ranx.Qrels.

        Args:
            d (Dict[str, Dict[str, int]]): Qrels as Python dictionary

        Returns:
            Qrels: ranx.Qrels
        """
        # Query IDs
        q_ids = list(d.keys())
        q_ids = TypedList(q_ids)

        # Doc IDs
        doc_ids = [list(doc.keys()) for doc in d.values()]
        max_len = max(len(y) for x in doc_ids for y in x)
        dtype = f"<U{max_len}"
        doc_ids = TypedList([np.array(x, dtype=dtype) for x in doc_ids])

        # Scores
        scores = [list(doc.values()) for doc in d.values()]
        scores = TypedList([np.array(x, dtype=int) for x in scores])

        qrels = Qrels()
        qrels.qrels = create_and_sort(q_ids, doc_ids, scores)
        qrels.sorted = True

        return qrels

    @staticmethod
    def from_file(path: str, kind: str = None):
        """Parse a qrels file into ranx.Qrels. Supported formats are JSON, TREC qrels, and gzipped TREC qrels. Correct import behavior is inferred from the file extension: ".json" -> "json", ".trec" -> "trec", ".txt" -> "trec", ".gz" -> "gzipped trec". Use the "kind" argument to override this behavior.

        Args:
            path (str): File path.
            kind (str, optional): Kind of file to load, must be either "json" or "trec".

        Returns:
            Qrels: ranx.Qrels
        """
        # Infer file extension -------------------------------------------------
        kind = get_file_kind(path, kind)

        # Load Qrels -----------------------------------------------------------
        if kind == "json":
            qrels = orjson.loads(open(path, "rb").read())
        else:
            qrels = defaultdict(dict)
            with gzip.open(path, "rt") if kind == "gz" else open(path) as f:
                for line in f:
                    q_id, _, doc_id, rel = line.split()
                    qrels[q_id][doc_id] = int(rel)

        return Qrels.from_dict(qrels)

    @staticmethod
    def from_df(
        df: pd.DataFrame,
        q_id_col: str = "q_id",
        doc_id_col: str = "doc_id",
        score_col: str = "score",
    ):
        """Convert a Pandas DataFrame to ranx.Qrels.

        Args:
            df (pandas.DataFrame): Qrels as Pandas DataFrame.
            q_id_col (str, optional): Query IDs column. Defaults to "q_id".
            doc_id_col (str, optional): Document IDs column. Defaults to "doc_id".
            score_col (str, optional): Relevance score judgments column. Defaults to "score".

        Returns:
            Qrels: ranx.Qrels
        """
        assert (
            df[q_id_col].dtype == "O"
        ), "DataFrame Query IDs column dtype must be `object` (string)"
        assert (
            df[doc_id_col].dtype == "O"
        ), "DataFrame Document IDs column dtype must be `object` (string)"
        assert (
            df[score_col].dtype == np.int64
        ), "DataFrame scores column dtype must be `int`"

        qrels_dict = (
            df.groupby(q_id_col)[[doc_id_col, score_col]]
            .apply(lambda g: {x[0]: x[1] for x in g.values.tolist()})
            .to_dict()
        )

        return Qrels.from_dict(qrels_dict)

    @staticmethod
    def from_parquet(
        path: str,
        q_id_col: str = "q_id",
        doc_id_col: str = "doc_id",
        score_col: str = "score",
        pd_kwargs: Dict[str, Any] = None,
    ):
        """Convert a Parquet file to ranx.Qrels.

        Args:
            path (str): File path.
            q_id_col (str, optional): Query IDs column. Defaults to "q_id".
            doc_id_col (str, optional): Document IDs column. Defaults to "doc_id".
            score_col (str, optional): Relevance score judgments column. Defaults to "score".
            pd_kwargs (Dict[str, Any], optional): Additional arguments to pass to `pandas.read_parquet` (see https://pandas.pydata.org/docs/reference/api/pandas.read_parquet.html). Defaults to None.

        Returns:
            Qrels: ranx.Qrels
        """
        pd_kwargs = {} if pd_kwargs is None else pd_kwargs

        return Qrels.from_df(
            df=pd.read_parquet(path, **pd_kwargs),
            q_id_col=q_id_col,
            doc_id_col=doc_id_col,
            score_col=score_col,
        )

    @staticmethod
    def from_ir_datasets(dataset_id: str):
        """Convert `ir-datasets` qrels into ranx.Qrels. It automatically downloads data if missing.
        Args:
            dataset_id (str): ID of the detaset in `ir-datasets`. `ir-datasets` catalog is available here: https://ir-datasets.com/index.html.
        Returns:
            Qrels: ranx.Qrels
        """
        qrels = Qrels.from_dict(ir_datasets.load(dataset_id).qrels_dict())
        qrels.name = dataset_id
        return qrels

    @property
    def size(self):
        return len(self.qrels)

    def __getitem__(self, q_id):
        return dict(self.qrels[q_id])

    def __len__(self) -> int:
        return len(self.qrels)

    def __repr__(self):
        return self.qrels.__repr__()

    def __str__(self):
        return self.qrels.__str__()

add(q_id, doc_ids, scores)

Add a query and its relevant documents with the associated relevance score judgment.

Parameters:

Name Type Description Default
q_id str

Query ID

required
doc_ids List[str]

List of Document IDs

required
scores List[int]

List of relevance score judgments

required
Source code in ranx/data_structures/qrels.py
def add(self, q_id: str, doc_ids: List[str], scores: List[int]):
    """Add a query and its relevant documents with the associated relevance score judgment.

    Args:
        q_id (str): Query ID
        doc_ids (List[str]): List of Document IDs
        scores (List[int]): List of relevance score judgments
    """
    self.add_multi([q_id], [doc_ids], [scores])
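
A minimal usage sketch (the query ID, document IDs, and scores below are illustrative):

from ranx import Qrels

qrels = Qrels()
qrels.add(
    q_id="q_3",
    doc_ids=["d_7", "d_8"],
    scores=[2, 1],
)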

add_multi(q_ids, doc_ids, scores)

Add multiple queries at once.

Parameters:

Name Type Description Default
q_ids List[str]

List of Query IDs

required
doc_ids List[List[str]]

List of list of Document IDs

required
scores List[List[int]]

List of list of relevance score judgments

required
Source code in ranx/data_structures/qrels.py
def add_multi(
    self,
    q_ids: List[str],
    doc_ids: List[List[str]],
    scores: List[List[int]],
):
    """Add multiple queries at once.

    Args:
        q_ids (List[str]): List of Query IDs
        doc_ids (List[List[str]]): List of list of Document IDs
        scores (List[List[int]]): List of list of relevance score judgments
    """
    q_ids = TypedList(q_ids)
    doc_ids = TypedList([TypedList(x) for x in doc_ids])
    scores = TypedList([TypedList(map(int, x)) for x in scores])

    self.qrels = add_and_sort(self.qrels, q_ids, doc_ids, scores)
    self.sorted = True
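
A minimal usage sketch for adding several queries in one call (IDs and scores are illustrative):

from ranx import Qrels

qrels = Qrels()
qrels.add_multi(
    q_ids=["q_1", "q_2"],
    doc_ids=[["d_12", "d_25"], ["d_11", "d_2"]],
    scores=[[5, 3], [6, 1]],
)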

add_score(q_id, doc_id, score)

Add a (doc_id, score) pair to a query (or, change its value if it already exists).

Parameters:

Name Type Description Default
q_id str

Query ID

required
doc_id str

Document ID

required
score int

Relevance score judgment

required
Source code in ranx/data_structures/qrels.py
def add_score(self, q_id: str, doc_id: str, score: int):
    """Add a (doc_id, score) pair to a query (or, change its value if it already exists).

    Args:
        q_id (str): Query ID
        doc_id (str): Document ID
        score (int): Relevance score judgment
    """
    if self.qrels.get(q_id) is None:
        self.qrels[q_id] = TypedDict.empty(
            key_type=types.unicode_type,
            value_type=types.int64,
        )
    self.qrels[q_id][doc_id] = int(score)
    self.sorted = False
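
A minimal usage sketch (IDs and scores are illustrative); calling add_score again for the same pair overwrites the previous judgment:

from ranx import Qrels

qrels = Qrels()
qrels.add_score("q_1", "d_42", 3)  # creates the entry for "q_1" if needed
qrels.add_score("q_1", "d_42", 2)  # overwrites the previous judgment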

from_df(df, q_id_col='q_id', doc_id_col='doc_id', score_col='score') staticmethod

Convert a Pandas DataFrame to ranx.Qrels.

Parameters:

Name Type Description Default
df DataFrame

Qrels as Pandas DataFrame.

required
q_id_col str

Query IDs column. Defaults to "q_id".

'q_id'
doc_id_col str

Document IDs column. Defaults to "doc_id".

'doc_id'
score_col str

Relevance score judgments column. Defaults to "score".

'score'

Returns:

Name Type Description
Qrels

ranx.Qrels

Source code in ranx/data_structures/qrels.py
@staticmethod
def from_df(
    df: pd.DataFrame,
    q_id_col: str = "q_id",
    doc_id_col: str = "doc_id",
    score_col: str = "score",
):
    """Convert a Pandas DataFrame to ranx.Qrels.

    Args:
        df (pandas.DataFrame): Qrels as Pandas DataFrame.
        q_id_col (str, optional): Query IDs column. Defaults to "q_id".
        doc_id_col (str, optional): Document IDs column. Defaults to "doc_id".
        score_col (str, optional): Relevance score judgments column. Defaults to "score".

    Returns:
        Qrels: ranx.Qrels
    """
    assert (
        df[q_id_col].dtype == "O"
    ), "DataFrame Query IDs column dtype must be `object` (string)"
    assert (
        df[doc_id_col].dtype == "O"
    ), "DataFrame Document IDs column dtype must be `object` (string)"
    assert (
        df[score_col].dtype == np.int64
    ), "DataFrame scores column dtype must be `int`"

    qrels_dict = (
        df.groupby(q_id_col)[[doc_id_col, score_col]]
        .apply(lambda g: {x[0]: x[1] for x in g.values.tolist()})
        .to_dict()
    )

    return Qrels.from_dict(qrels_dict)
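
For example, assuming a DataFrame whose ID columns hold strings and whose score column holds integers (the column names below are the defaults):

import pandas as pd
from ranx import Qrels

df = pd.DataFrame(
    {
        "q_id": ["q_1", "q_1", "q_2"],
        "doc_id": ["d_1", "d_2", "d_3"],
        "score": [1, 2, 2],
    }
)

qrels = Qrels.from_df(df)  # default column names: q_id, doc_id, score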

from_dict(d) staticmethod

Convert a Python dictionary in form of {q_id: {doc_id: score}} to ranx.Qrels.

Parameters:

Name Type Description Default
d Dict[str, Dict[str, int]]

Qrels as Python dictionary

required

Returns:

Name Type Description
Qrels

ranx.Qrels

Source code in ranx/data_structures/qrels.py
@staticmethod
def from_dict(d: Dict[str, Dict[str, int]]):
    """Convert a Python dictionary in form of {q_id: {doc_id: score}} to ranx.Qrels.

    Args:
        d (Dict[str, Dict[str, int]]): Qrels as Python dictionary

    Returns:
        Qrels: ranx.Qrels
    """
    # Query IDs
    q_ids = list(d.keys())
    q_ids = TypedList(q_ids)

    # Doc IDs
    doc_ids = [list(doc.keys()) for doc in d.values()]
    max_len = max(len(y) for x in doc_ids for y in x)
    dtype = f"<U{max_len}"
    doc_ids = TypedList([np.array(x, dtype=dtype) for x in doc_ids])

    # Scores
    scores = [list(doc.values()) for doc in d.values()]
    scores = TypedList([np.array(x, dtype=int) for x in scores])

    qrels = Qrels()
    qrels.qrels = create_and_sort(q_ids, doc_ids, scores)
    qrels.sorted = True

    return qrels
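
A minimal usage sketch, equivalent to passing the dictionary to the constructor:

from ranx import Qrels

qrels_dict = {
    "q_1": {"d_1": 1, "d_2": 2},
    "q_2": {"d_3": 2, "d_2": 1, "d_5": 3},
}

qrels = Qrels.from_dict(qrels_dict)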

from_file(path, kind=None) staticmethod

Parse a qrels file into ranx.Qrels. Supported formats are JSON, TREC qrels, and gzipped TREC qrels. Correct import behavior is inferred from the file extension: ".json" -> "json", ".trec" -> "trec", ".txt" -> "trec", ".gz" -> "gzipped trec". Use the "kind" argument to override this behavior.

Parameters:

Name Type Description Default
path str

File path.

required
kind str

Kind of file to load, must be either "json" or "trec".

None

Returns:

Name Type Description
Qrels

ranx.Qrels

Source code in ranx/data_structures/qrels.py
@staticmethod
def from_file(path: str, kind: str = None):
    """Parse a qrels file into ranx.Qrels. Supported formats are JSON, TREC qrels, and gzipped TREC qrels. Correct import behavior is inferred from the file extension: ".json" -> "json", ".trec" -> "trec", ".txt" -> "trec", ".gz" -> "gzipped trec". Use the "kind" argument to override this behavior.

    Args:
        path (str): File path.
        kind (str, optional): Kind of file to load, must be either "json" or "trec".

    Returns:
        Qrels: ranx.Qrels
    """
    # Infer file extension -------------------------------------------------
    kind = get_file_kind(path, kind)

    # Load Qrels -----------------------------------------------------------
    if kind == "json":
        qrels = orjson.loads(open(path, "rb").read())
    else:
        qrels = defaultdict(dict)
        with gzip.open(path, "rt") if kind == "gz" else open(path) as f:
            for line in f:
                q_id, _, doc_id, rel = line.split()
                qrels[q_id][doc_id] = int(rel)

    return Qrels.from_dict(qrels)
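
For example, given a TREC-style qrels file where each line reads q_id 0 doc_id score (the file names below are illustrative):

from ranx import Qrels

qrels = Qrels.from_file("msmarco_qrels.trec")              # kind inferred from ".trec"
qrels = Qrels.from_file("msmarco_qrels.txt", kind="trec")  # or set kind explicitly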

from_ir_datasets(dataset_id) staticmethod

Convert ir-datasets qrels into ranx.Qrels. It automatically downloads data if missing.

Parameters:

Name Type Description Default
dataset_id str

ID of the dataset in ir-datasets. The ir-datasets catalog is available here: https://ir-datasets.com/index.html.

required

Returns:

Name Type Description
Qrels

ranx.Qrels

Source code in ranx/data_structures/qrels.py
@staticmethod
def from_ir_datasets(dataset_id: str):
    """Convert `ir-datasets` qrels into ranx.Qrels. It automatically downloads data if missing.
    Args:
        dataset_id (str): ID of the detaset in `ir-datasets`. `ir-datasets` catalog is available here: https://ir-datasets.com/index.html.
    Returns:
        Qrels: ranx.Qrels
    """
    qrels = Qrels.from_dict(ir_datasets.load(dataset_id).qrels_dict())
    qrels.name = dataset_id
    return qrels
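
A minimal usage sketch (the dataset ID below is just an example; any ID from the ir-datasets catalog works):

from ranx import Qrels

qrels = Qrels.from_ir_datasets("msmarco-passage/dev/small")
print(qrels.name)  # the dataset ID is used as the Qrels name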

from_parquet(path, q_id_col='q_id', doc_id_col='doc_id', score_col='score', pd_kwargs=None) staticmethod

Convert a Parquet file to ranx.Qrels.

Parameters:

Name Type Description Default
path str

File path.

required
q_id_col str

Query IDs column. Defaults to "q_id".

'q_id'
doc_id_col str

Document IDs column. Defaults to "doc_id".

'doc_id'
score_col str

Relevance score judgments column. Defaults to "score".

'score'
pd_kwargs Dict[str, Any]

Additional arguments to pass to pandas.read_parquet (see https://pandas.pydata.org/docs/reference/api/pandas.read_parquet.html). Defaults to None.

None

Returns:

Name Type Description
Qrels

ranx.Qrels

Source code in ranx/data_structures/qrels.py
@staticmethod
def from_parquet(
    path: str,
    q_id_col: str = "q_id",
    doc_id_col: str = "doc_id",
    score_col: str = "score",
    pd_kwargs: Dict[str, Any] = None,
):
    """Convert a Parquet file to ranx.Qrels.

    Args:
        path (str): File path.
        q_id_col (str, optional): Query IDs column. Defaults to "q_id".
        doc_id_col (str, optional): Document IDs column. Defaults to "doc_id".
        score_col (str, optional): Relevance score judgments column. Defaults to "score".
        pd_kwargs (Dict[str, Any], optional): Additional arguments to pass to `pandas.read_parquet` (see https://pandas.pydata.org/docs/reference/api/pandas.read_parquet.html). Defaults to None.

    Returns:
        Qrels: ranx.Qrels
    """
    pd_kwargs = {} if pd_kwargs is None else pd_kwargs

    return Qrels.from_df(
        df=pd.read_parquet(path, **pd_kwargs),
        q_id_col=q_id_col,
        doc_id_col=doc_id_col,
        score_col=score_col,
    )
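
A minimal usage sketch (file and column names are illustrative); pd_kwargs is forwarded to pandas.read_parquet:

from ranx import Qrels

qrels = Qrels.from_parquet("qrels.parquet")  # default column names: q_id, doc_id, score

qrels = Qrels.from_parquet(
    "custom_qrels.parquet",
    q_id_col="query_id",
    doc_id_col="document_id",
    score_col="relevance",
    pd_kwargs={"engine": "pyarrow"},
)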

get_doc_ids_and_scores()

Returns doc ids and relevance judgments.

Source code in ranx/data_structures/qrels.py
def get_doc_ids_and_scores(self):
    """Returns doc ids and relevance judgments."""
    return list(self.qrels.values())

get_query_ids()

Returns query ids.

Source code in ranx/data_structures/qrels.py
def get_query_ids(self):
    """Returns query ids."""
    return list(self.qrels.keys())

keys()

Returns query ids. Used internally.

Source code in ranx/data_structures/qrels.py
def keys(self):
    """Returns query ids. Used internally."""
    return self.qrels.keys()

save(path='qrels.json', kind=None)

Write qrels to path as JSON file, TREC qrels format, or Parquet file. File type is automatically inferred from the filename extension: ".json" -> "json", ".trec" -> "trec", ".txt" -> "trec", ".parq" -> "parquet", ".parquet" -> "parquet". Use the "kind" argument to override this behavior.

Parameters:

Name Type Description Default
path str

Saving path. Defaults to "qrels.json".

'qrels.json'
kind str

Kind of file to save, must be either "json", "trec", or "parquet". If None, it will be automatically inferred from the filename extension.

None
Source code in ranx/data_structures/qrels.py
def save(self, path: str = "qrels.json", kind: str = None) -> None:
    """Write `qrels` to `path` as JSON file, TREC qrels format, or Parquet file. File type is automatically inferred form the filename extension: ".json" -> "json", ".trec" -> "trec", ".txt" -> "trec", ".parq" -> "parquet", ".parquet" -> "parquet". Use the "kind" argument to override this behavior.

    Args:
        path (str, optional): Saving path. Defaults to "qrels.json".
        kind (str, optional): Kind of file to save, must be either "json", "trec", or "parquet". If None, it will be automatically inferred from the filename extension.
    """
    # Infer file extension -------------------------------------------------
    kind = get_file_kind(path, kind)

    # Save Qrels -----------------------------------------------------------
    if kind == "json":
        with open(path, "wb") as f:
            f.write(orjson.dumps(self.to_dict(), option=orjson.OPT_INDENT_2))
    elif kind == "parquet":
        self.to_dataframe().to_parquet(path, index=False)
    else:
        with open(path, "w") as f:
            for i, q_id in enumerate(self.qrels.keys()):
                for j, doc_id in enumerate(self.qrels[q_id].keys()):
                    score = self.qrels[q_id][doc_id]
                    f.write(f"{q_id} 0 {doc_id} {score}")

                    if (
                        i != len(self.qrels.keys()) - 1
                        or j != len(self.qrels[q_id].keys()) - 1
                    ):
                        f.write("\n")

set_relevance_level(rel_lvl=1)

Sets relevance level.

Source code in ranx/data_structures/qrels.py
def set_relevance_level(self, rel_lvl: int = 1):
    """Sets relevance level."""
    self.qrels = _set_relevance_level(self.qrels, rel_lvl)

sort()

Sort. Used internally.

Source code in ranx/data_structures/qrels.py
def sort(self):
    """Sort. Used internally."""
    self.qrels = sort_dict_by_key(self.qrels)
    self.qrels = sort_dict_of_dict_by_value(self.qrels)
    self.sorted = True

to_dataframe()

Convert Qrels to Pandas DataFrame with the following columns: q_id, doc_id, and score.

Returns:

Type Description
DataFrame

pandas.DataFrame: Qrels as Pandas DataFrame.

Source code in ranx/data_structures/qrels.py
def to_dataframe(self) -> pd.DataFrame:
    """Convert Qrels to Pandas DataFrame with the following columns: `q_id`, `doc_id`, and `score`.

    Returns:
        pandas.DataFrame: Qrels as Pandas DataFrame.
    """
    data = {"q_id": [], "doc_id": [], "score": []}

    for q_id in self.qrels:
        for doc_id in self.qrels[q_id]:
            data["q_id"].append(q_id)
            data["doc_id"].append(doc_id)
            data["score"].append(self.qrels[q_id][doc_id])

    return pd.DataFrame.from_dict(data)

to_dict()

Convert Qrels to Python dictionary.

Returns:

Type Description
Dict[str, Dict[str, int]]

Dict[str, Dict[str, int]]: Qrels as Python dictionary

Source code in ranx/data_structures/qrels.py
def to_dict(self) -> Dict[str, Dict[str, int]]:
    """Convert Qrels to Python dictionary.

    Returns:
        Dict[str, Dict[str, int]]: Qrels as Python dictionary
    """
    d = defaultdict(dict)
    for q_id in self.keys():
        d[q_id] = dict(self[q_id])
    return d

to_typed_list()

Convert Qrels to Numba Typed List. Used internally.

Source code in ranx/data_structures/qrels.py
def to_typed_list(self):
    """Convert Qrels to Numba Typed List. Used internally."""
    if not self.sorted:
        self.sort()
    return to_typed_list(self.qrels)

Run

Bases: object

Run stores the relevance scores estimated by the model under evaluation. The preferred way to create a Run instance is to convert a Python dictionary, as follows:

run_dict = {
    "q_1": {
        "d_1": 1.5,
        "d_2": 2.6,
    },
    "q_2": {
        "d_3": 2.8,
        "d_2": 1.2,
        "d_5": 3.1,
    },
}

run = Run(run_dict, name="bm25")

run = Run()  # Creates an empty Run with no name
Source code in ranx/data_structures/run.py
class Run(object):
    """`Run` stores the relevance scores estimated by the model under evaluation.<\br>
    The preferred way for creating a `Run` instance is converting a Python dictionary as follows:

    ```python
    run_dict = {
        "q_1": {
            "d_1": 1.5,
            "d_2": 2.6,
        },
        "q_2": {
            "d_3": 2.8,
            "d_2": 1.2,
            "d_5": 3.1,
        },
    }

    run = Run(run_dict, name="bm25")

    run = Run()  # Creates an empty Run with no name
    ```
    """

    def __init__(self, run: Dict[str, Dict[str, float]] = None, name: str = None):
        if run is None:
            self.run = TypedDict.empty(
                key_type=types.unicode_type,
                value_type=types.DictType(types.unicode_type, types.float64),
            )
            self.sorted = False
        else:
            # Query IDs
            q_ids = list(run.keys())
            q_ids = TypedList(q_ids)

            # Doc IDs
            doc_ids = [list(doc.keys()) for doc in run.values()]
            max_len = max(len(y) for x in doc_ids for y in x)
            dtype = f"<U{max_len}"
            doc_ids = TypedList([np.array(x, dtype=dtype) for x in doc_ids])

            # Scores
            scores = [list(doc.values()) for doc in run.values()]
            scores = TypedList([np.array(x, dtype=float) for x in scores])
            self.run = create_and_sort(q_ids, doc_ids, scores)
            self.sorted = True

        self.name = name
        self.metadata = {}
        self.scores = defaultdict(dict)
        self.mean_scores = {}
        self.std_scores = {}

    def keys(self):
        """Returns query ids. Used internally."""
        return self.run.keys()

    def add_score(self, q_id: str, doc_id: str, score: int):
        """Add a (doc_id, score) pair to a query (or, change its value if it already exists).

        Args:
            q_id (str): Query ID
            doc_id (str): Document ID
            score (int): Relevance score
        """
        if self.run.get(q_id) is None:
            self.run[q_id] = TypedDict.empty(
                key_type=types.unicode_type,
                value_type=types.float64,
            )
        self.run[q_id][doc_id] = float(score)
        self.sorted = False

    def add(self, q_id: str, doc_ids: List[str], scores: List[float]):
        """Add a query and its relevant documents with the associated relevance score.

        Args:
            q_id (str): Query ID
            doc_ids (List[str]): List of Document IDs
            scores (List[float]): List of relevance scores
        """
        self.add_multi([q_id], [doc_ids], [scores])

    def add_multi(
        self,
        q_ids: List[str],
        doc_ids: List[List[str]],
        scores: List[List[float]],
    ):
        """Add multiple queries at once.

        Args:
            q_ids (List[str]): List of Query IDs
            doc_ids (List[List[str]]): List of list of Document IDs
            scores (List[List[float]]): List of list of relevance scores
        """
        q_ids = TypedList(q_ids)
        doc_ids = TypedList([TypedList(x) for x in doc_ids])
        scores = TypedList([TypedList(map(float, x)) for x in scores])

        self.run = add_and_sort(self.run, q_ids, doc_ids, scores)
        self.sorted = True

    def get_query_ids(self):
        """Returns query ids."""
        return list(self.run.keys())

    def get_doc_ids_and_scores(self):
        """Returns doc ids and relevance scores."""
        return list(self.run.values())

    # Sort in place
    def sort(self):
        """Sort. Used internally."""
        self.run = sort_dict_by_key(self.run)
        self.run = sort_dict_of_dict_by_value(self.run)
        self.sorted = True

    def make_comparable(self, qrels: Qrels):
        """Adds empty results for queries missing from the run and removes those not appearing in qrels."""
        # Adds empty results for missing queries
        for q_id in qrels.qrels:
            if q_id not in self.run:
                self.run[q_id] = create_empty_results_dict()

        # Remove results for additional queries
        for q_id in list(self.run):  # copy keys to allow deletion during iteration
            if q_id not in qrels.qrels:
                del self.run[q_id]

        self.sort()

        return self

    def to_typed_list(self):
        """Convert Run to Numba Typed List. Used internally."""
        if not self.sorted:
            self.sort()
        return to_typed_list(self.run)

    def to_dict(self):
        """Convert Run to Python dictionary.

        Returns:
            Dict[str, Dict[str, int]]: Run as Python dictionary
        """
        d = defaultdict(dict)
        for q_id in self.keys():
            d[q_id] = dict(self[q_id])
        return d

    def to_dataframe(self) -> pd.DataFrame:
        """Convert Run to Pandas DataFrame with the following columns: `q_id`, `doc_id`, and `score`.

        Returns:
            pandas.DataFrame: Run as Pandas DataFrame.
        """
        data = {"q_id": [], "doc_id": [], "score": []}

        for q_id in self.run:
            for doc_id in self.run[q_id]:
                data["q_id"].append(q_id)
                data["doc_id"].append(doc_id)
                data["score"].append(self.run[q_id][doc_id])

        return pd.DataFrame.from_dict(data)

    def save(self, path: str = "run.json", kind: str = None):
        """Write `run` to `path` as JSON file, TREC run, LZ4 file, or Parquet file. File type is automatically inferred form the filename extension: ".json" -> "json", ".trec" -> "trec", ".txt" -> "trec", and ".lz4" -> "lz4", ".parq" -> "parquet", ".parquet" -> "parquet". Use the "kind" argument to override this behavior.

        Args:
            path (str, optional): Saving path. Defaults to "run.json".
            kind (str, optional): Kind of file to save, must be either "json", "trec", "lz4", or "parquet". If None, it will be automatically inferred from the filename extension.
        """
        # Infer file extension -------------------------------------------------
        kind = get_file_kind(path, kind)

        # Save Run -------------------------------------------------------------
        if not self.sorted:
            self.sort()

        if kind == "json":
            save_json(self.to_dict(), path)
        elif kind == "lz4":
            save_lz4(self.to_dict(), path)
        elif kind == "parquet":
            self.to_dataframe().to_parquet(path, index=False)
        else:
            with open(path, "w") as f:
                for i, q_id in enumerate(self.run.keys()):
                    for rank, doc_id in enumerate(self.run[q_id].keys()):
                        score = self.run[q_id][doc_id]
                        f.write(f"{q_id} Q0 {doc_id} {rank+1} {score} {self.name}")

                        if (
                            i != len(self.run.keys()) - 1
                            or rank != len(self.run[q_id].keys()) - 1
                        ):
                            f.write("\n")

    @staticmethod
    def from_dict(d: Dict[str, Dict[str, float]], name: str = None):
        """Convert a Python dictionary in form of {q_id: {doc_id: score}} to ranx.Run.

        Args:
            d (Dict[str, Dict[str, int]]): Run as Python dictionary
            name (str, optional): Run name. Defaults to None.

        Returns:
            Run: ranx.Run
        """

        # Query IDs
        q_ids = list(d.keys())
        q_ids = TypedList(q_ids)

        # Doc IDs
        doc_ids = [list(doc.keys()) for doc in d.values()]
        max_len = max(len(y) for x in doc_ids for y in x)
        dtype = f"<U{max_len}"
        doc_ids = TypedList([np.array(x, dtype=dtype) for x in doc_ids])

        # Scores
        scores = [list(doc.values()) for doc in d.values()]
        scores = TypedList([np.array(x, dtype=float) for x in scores])

        run = Run()
        run.run = create_and_sort(q_ids, doc_ids, scores)
        run.sorted = True
        run.name = name

        return run

    @staticmethod
    def from_file(path: str, kind: str = None, name: str = None):
        """Parse a run file into ranx.Run. Supported formats are JSON, TREC run, gzipped TREC run, and LZ4. Correct import behavior is inferred from the file extension: ".json" -> "json", ".trec" -> "trec", ".txt" -> "trec", ".gz" -> "gzipped trec", ".lz4" -> "lz4". Use the "kind" argument to override this behavior.

        Args:
            path (str): File path.
            kind (str, optional): Kind of file to load, must be either "json", "trec", or "lz4".
            name (str, optional): Run name. Defaults to None.

        Returns:
            Run: ranx.Run
        """
        # Infer file extension -------------------------------------------------
        kind = get_file_kind(path, kind)

        # Load Run -------------------------------------------------------------
        if kind == "json":
            run = load_json(path)
        elif kind == "lz4":
            run = load_lz4(path)
        else:
            run = defaultdict(dict)
            with gzip.open(path, "rt") if kind == "gz" else open(path) as f:
                for line in f:
                    q_id, _, doc_id, _, rel, run_name = line.split()
                    run[q_id][doc_id] = float(rel)
                    if name is None:
                        name = run_name

        run = Run.from_dict(run, name)

        return run

    @staticmethod
    def from_df(
        df: pd.DataFrame,
        q_id_col: str = "q_id",
        doc_id_col: str = "doc_id",
        score_col: str = "score",
        name: str = None,
    ):
        """Convert a Pandas DataFrame to ranx.Run.

        Args:
            df (pd.DataFrame): Run as Pandas DataFrame
            q_id_col (str, optional): Query IDs column. Defaults to "q_id".
            doc_id_col (str, optional): Document IDs column. Defaults to "doc_id".
            score_col (str, optional): Relevance scores column. Defaults to "score".
            name (str, optional): Run name. Defaults to None.

        Returns:
            Run: ranx.Run
        """
        assert (
            df[q_id_col].dtype == "O"
        ), "DataFrame Query IDs column dtype must be `object` (string)"
        assert (
            df[doc_id_col].dtype == "O"
        ), "DataFrame Document IDs column dtype must be `object` (string)"
        assert (
            df[score_col].dtype == np.float64
        ), "DataFrame scores column dtype must be `float`"

        run_py = (
            df.groupby(q_id_col)[[doc_id_col, score_col]]
            .apply(lambda g: {x[0]: x[1] for x in g.values.tolist()})
            .to_dict()
        )

        return Run.from_dict(run_py, name)

    @staticmethod
    def from_parquet(
        path: str,
        q_id_col: str = "q_id",
        doc_id_col: str = "doc_id",
        score_col: str = "score",
        pd_kwargs: Dict[str, Any] = None,
        name: str = None,
    ):
        """Convert a Parquet file to ranx.Run.

        Args:
            path (str): File path.
            q_id_col (str, optional): Query IDs column. Defaults to "q_id".
            doc_id_col (str, optional): Document IDs column. Defaults to "doc_id".
            score_col (str, optional): Relevance scores column. Defaults to "score".
            pd_kwargs (Dict[str, Any], optional): Additional arguments to pass to `pandas.read_parquet` (see https://pandas.pydata.org/docs/reference/api/pandas.read_parquet.html). Defaults to None.
            name (str, optional): Run name. Defaults to None.

        Returns:
            Run: ranx.Run
        """
        pd_kwargs = {} if pd_kwargs is None else pd_kwargs

        return Run.from_df(
            df=pd.read_parquet(path, **pd_kwargs),
            q_id_col=q_id_col,
            doc_id_col=doc_id_col,
            score_col=score_col,
            name=name,
        )

    @staticmethod
    def from_ranxhub(id: str):
        """Download and load a ranx.Run from ranxhub.

        Args:
            id (str): Run ID.

        Returns:
            Run: ranx.Run
        """
        content = download(id)

        run = Run.from_dict(content["run"])
        run.name = content["metadata"]["run"]["name"]
        run.metadata = content["metadata"]

        return run

    @property
    def size(self):
        return len(self.run)

    def __getitem__(self, q_id):
        return dict(self.run[q_id])

    def __len__(self) -> int:
        return len(self.run)

    def __repr__(self):
        return self.run.__repr__()

    def __str__(self):
        return self.run.__str__()

add(q_id, doc_ids, scores)

Add a query and its relevant documents with the associated relevance score.

Parameters:

Name Type Description Default
q_id str

Query ID

required
doc_ids List[str]

List of Document IDs

required
scores List[float]

List of relevance scores

required
Source code in ranx/data_structures/run.py
def add(self, q_id: str, doc_ids: List[str], scores: List[float]):
    """Add a query and its relevant documents with the associated relevance score.

    Args:
        q_id (str): Query ID
        doc_ids (List[str]): List of Document IDs
        scores (List[float]): List of relevance scores
    """
    self.add_multi([q_id], [doc_ids], [scores])

add_multi(q_ids, doc_ids, scores)

Add multiple queries at once.

Parameters:

Name Type Description Default
q_ids List[str]

List of Query IDs

required
doc_ids List[List[str]]

List of list of Document IDs

required
scores List[List[float]]

List of list of relevance scores

required
Source code in ranx/data_structures/run.py
def add_multi(
    self,
    q_ids: List[str],
    doc_ids: List[List[str]],
    scores: List[List[float]],
):
    """Add multiple queries at once.

    Args:
        q_ids (List[str]): List of Query IDs
        doc_ids (List[List[str]]): List of list of Document IDs
        scores (List[List[float]]): List of list of relevance scores
    """
    q_ids = TypedList(q_ids)
    doc_ids = TypedList([TypedList(x) for x in doc_ids])
    scores = TypedList([TypedList(map(float, x)) for x in scores])

    self.run = add_and_sort(self.run, q_ids, doc_ids, scores)
    self.sorted = True

add_score(q_id, doc_id, score)

Add a (doc_id, score) pair to a query (or, change its value if it already exists).

Parameters:

Name Type Description Default
q_id str

Query ID

required
doc_id str

Document ID

required
score int

Relevance score

required
Source code in ranx/data_structures/run.py
def add_score(self, q_id: str, doc_id: str, score: int):
    """Add a (doc_id, score) pair to a query (or, change its value if it already exists).

    Args:
        q_id (str): Query ID
        doc_id (str): Document ID
        score (int): Relevance score
    """
    if self.run.get(q_id) is None:
        self.run[q_id] = TypedDict.empty(
            key_type=types.unicode_type,
            value_type=types.float64,
        )
    self.run[q_id][doc_id] = float(score)
    self.sorted = False

from_df(df, q_id_col='q_id', doc_id_col='doc_id', score_col='score', name=None) staticmethod

Convert a Pandas DataFrame to ranx.Run.

Parameters:

Name Type Description Default
df DataFrame

Run as Pandas DataFrame

required
q_id_col str

Query IDs column. Defaults to "q_id".

'q_id'
doc_id_col str

Document IDs column. Defaults to "doc_id".

'doc_id'
score_col str

Relevance scores column. Defaults to "score".

'score'
name str

Run name. Defaults to None.

None

Returns:

Name Type Description
Run

ranx.Run

Source code in ranx/data_structures/run.py
@staticmethod
def from_df(
    df: pd.DataFrame,
    q_id_col: str = "q_id",
    doc_id_col: str = "doc_id",
    score_col: str = "score",
    name: str = None,
):
    """Convert a Pandas DataFrame to ranx.Run.

    Args:
        df (pd.DataFrame): Run as Pandas DataFrame
        q_id_col (str, optional): Query IDs column. Defaults to "q_id".
        doc_id_col (str, optional): Document IDs column. Defaults to "doc_id".
        score_col (str, optional): Relevance scores column. Defaults to "score".
        name (str, optional): Run name. Defaults to None.

    Returns:
        Run: ranx.Run
    """
    assert (
        df[q_id_col].dtype == "O"
    ), "DataFrame Query IDs column dtype must be `object` (string)"
    assert (
        df[doc_id_col].dtype == "O"
    ), "DataFrame Document IDs column dtype must be `object` (string)"
    assert (
        df[score_col].dtype == np.float64
    ), "DataFrame scores column dtype must be `float`"

    run_py = (
        df.groupby(q_id_col)[[doc_id_col, score_col]]
        .apply(lambda g: {x[0]: x[1] for x in g.values.tolist()})
        .to_dict()
    )

    return Run.from_dict(run_py, name)

from_dict(d, name=None) staticmethod

Convert a Python dictionary in form of {q_id: {doc_id: score}} to ranx.Run.

Parameters:

Name Type Description Default
d Dict[str, Dict[str, int]]

Run as Python dictionary

required
name str

Run name. Defaults to None.

None

Returns:

Name Type Description
Run

ranx.Run

Source code in ranx/data_structures/run.py
@staticmethod
def from_dict(d: Dict[str, Dict[str, float]], name: str = None):
    """Convert a Python dictionary in form of {q_id: {doc_id: score}} to ranx.Run.

    Args:
        d (Dict[str, Dict[str, int]]): Run as Python dictionary
        name (str, optional): Run name. Defaults to None.

    Returns:
        Run: ranx.Run
    """

    # Query IDs
    q_ids = list(d.keys())
    q_ids = TypedList(q_ids)

    # Doc IDs
    doc_ids = [list(doc.keys()) for doc in d.values()]
    max_len = max(len(y) for x in doc_ids for y in x)
    dtype = f"<U{max_len}"
    doc_ids = TypedList([np.array(x, dtype=dtype) for x in doc_ids])

    # Scores
    scores = [list(doc.values()) for doc in d.values()]
    scores = TypedList([np.array(x, dtype=float) for x in scores])

    run = Run()
    run.run = create_and_sort(q_ids, doc_ids, scores)
    run.sorted = True
    run.name = name

    return run

from_file(path, kind=None, name=None) staticmethod

Parse a run file into ranx.Run. Supported formats are JSON, TREC run, gzipped TREC run, and LZ4. Correct import behavior is inferred from the file extension: ".json" -> "json", ".trec" -> "trec", ".txt" -> "trec", ".gz" -> "gzipped trec", ".lz4" -> "lz4". Use the "kind" argument to override this behavior.

Parameters:

Name Type Description Default
path str

File path.

required
kind str

Kind of file to load, must be either "json", "trec", or "lz4".

None
name str

Run name. Defaults to None.

None

Returns:

Name Type Description
Run

ranx.Run

Source code in ranx/data_structures/run.py
@staticmethod
def from_file(path: str, kind: str = None, name: str = None):
    """Parse a run file into ranx.Run. Supported formats are JSON, TREC run, gzipped TREC run, and LZ4. Correct import behavior is inferred from the file extension: ".json" -> "json", ".trec" -> "trec", ".txt" -> "trec", ".gz" -> "gzipped trec", ".lz4" -> "lz4". Use the "kind" argument to override this behavior.

    Args:
        path (str): File path.
        kind (str, optional): Kind of file to load, must be either "json", "trec", or "lz4".
        name (str, optional): Run name. Defaults to None.

    Returns:
        Run: ranx.Run
    """
    # Infer file extension -------------------------------------------------
    kind = get_file_kind(path, kind)

    # Load Run -------------------------------------------------------------
    if kind == "json":
        run = load_json(path)
    elif kind == "lz4":
        run = load_lz4(path)
    else:
        run = defaultdict(dict)
        with gzip.open(path, "rt") if kind == "gz" else open(path) as f:
            for line in f:
                q_id, _, doc_id, _, rel, run_name = line.split()
                run[q_id][doc_id] = float(rel)
                if name is None:
                    name = run_name

    run = Run.from_dict(run, name)

    return run
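
For example, given a TREC run file where each line reads q_id Q0 doc_id rank score run_name (the file names below are illustrative):

from ranx import Run

run = Run.from_file("bm25.trec")               # TREC run, kind inferred from ".trec"
run = Run.from_file("bm25.lz4", kind="lz4")    # LZ4-compressed run
run = Run.from_file("bm25.json", name="bm25")  # JSON run with an explicit name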

from_parquet(path, q_id_col='q_id', doc_id_col='doc_id', score_col='score', pd_kwargs=None, name=None) staticmethod

Convert a Parquet file to ranx.Run.

Parameters:

Name Type Description Default
path str

File path.

required
q_id_col str

Query IDs column. Defaults to "q_id".

'q_id'
doc_id_col str

Document IDs column. Defaults to "doc_id".

'doc_id'
score_col str

Relevance scores column. Defaults to "score".

'score'
pd_kwargs Dict[str, Any]

Additional arguments to pass to pandas.read_parquet (see https://pandas.pydata.org/docs/reference/api/pandas.read_parquet.html). Defaults to None.

None
name str

Run name. Defaults to None.

None

Returns:

Name Type Description
Run

ranx.Run

Source code in ranx/data_structures/run.py
@staticmethod
def from_parquet(
    path: str,
    q_id_col: str = "q_id",
    doc_id_col: str = "doc_id",
    score_col: str = "score",
    pd_kwargs: Dict[str, Any] = None,
    name: str = None,
):
    """Convert a Parquet file to ranx.Run.

    Args:
        path (str): File path.
        q_id_col (str, optional): Query IDs column. Defaults to "q_id".
        doc_id_col (str, optional): Document IDs column. Defaults to "doc_id".
        score_col (str, optional): Relevance scores column. Defaults to "score".
        pd_kwargs (Dict[str, Any], optional): Additional arguments to pass to `pandas.read_parquet` (see https://pandas.pydata.org/docs/reference/api/pandas.read_parquet.html). Defaults to None.
        name (str, optional): Run name. Defaults to None.

    Returns:
        Run: ranx.Run
    """
    pd_kwargs = {} if pd_kwargs is None else pd_kwargs

    return Run.from_df(
        df=pd.read_parquet(path, **pd_kwargs),
        q_id_col=q_id_col,
        doc_id_col=doc_id_col,
        score_col=score_col,
        name=name,
    )

from_ranxhub(id) staticmethod

Download and load a ranx.Run from ranxhub.

Parameters:

Name Type Description Default
id str

Run ID.

required

Returns:

Name Type Description
Run

ranx.Run

Source code in ranx/data_structures/run.py
@staticmethod
def from_ranxhub(id: str):
    """Download and load a ranx.Run from ranxhub.

    Args:
        id (str): Run ID.

    Returns:
        Run: ranx.Run
    """
    content = download(id)

    run = Run.from_dict(content["run"])
    run.name = content["metadata"]["run"]["name"]
    run.metadata = content["metadata"]

    return run
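
A minimal usage sketch; the placeholder below must be replaced with an actual run ID from the ranxhub catalog:

from ranx import Run

run = Run.from_ranxhub("<run-id>")  # placeholder ID, not a real run
print(run.name)                     # taken from the run's metadata
print(run.metadata)                 # full metadata shipped with the run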

get_doc_ids_and_scores()

Returns doc ids and relevance scores.

Source code in ranx/data_structures/run.py
def get_doc_ids_and_scores(self):
    """Returns doc ids and relevance scores."""
    return list(self.run.values())

get_query_ids()

Returns query ids.

Source code in ranx/data_structures/run.py
def get_query_ids(self):
    """Returns query ids."""
    return list(self.run.keys())

keys()

Returns query ids. Used internally.

Source code in ranx/data_structures/run.py
def keys(self):
    """Returns query ids. Used internally."""
    return self.run.keys()

make_comparable(qrels)

Adds empty results for queries missing from the run and removes those not appearing in qrels.

Source code in ranx/data_structures/run.py
def make_comparable(self, qrels: Qrels):
    """Adds empty results for queries missing from the run and removes those not appearing in qrels."""
    # Adds empty results for missing queries
    for q_id in qrels.qrels:
        if q_id not in self.run:
            self.run[q_id] = create_empty_results_dict()

    # Remove results for additional queries
    for q_id in list(self.run):  # copy keys to allow deletion during iteration
        if q_id not in qrels.qrels:
            del self.run[q_id]

    self.sort()

    return self
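
A minimal usage sketch; the same alignment can also be requested through evaluate(..., make_comparable=True), documented below:

# Align the run with the qrels before evaluation:
# queries missing from the run get empty result lists,
# queries absent from the qrels are dropped from the run.
run = run.make_comparable(qrels)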

save(path='run.json', kind=None)

Write run to path as JSON file, TREC run, LZ4 file, or Parquet file. File type is automatically inferred from the filename extension: ".json" -> "json", ".trec" -> "trec", ".txt" -> "trec", ".lz4" -> "lz4", ".parq" -> "parquet", ".parquet" -> "parquet". Use the "kind" argument to override this behavior.

Parameters:

Name Type Description Default
path str

Saving path. Defaults to "run.json".

'run.json'
kind str

Kind of file to save, must be either "json", "trec", "lz4", or "parquet". If None, it will be automatically inferred from the filename extension.

None
Source code in ranx/data_structures/run.py
def save(self, path: str = "run.json", kind: str = None):
    """Write `run` to `path` as JSON file, TREC run, LZ4 file, or Parquet file. File type is automatically inferred form the filename extension: ".json" -> "json", ".trec" -> "trec", ".txt" -> "trec", and ".lz4" -> "lz4", ".parq" -> "parquet", ".parquet" -> "parquet". Use the "kind" argument to override this behavior.

    Args:
        path (str, optional): Saving path. Defaults to "run.json".
        kind (str, optional): Kind of file to save, must be either "json", "trec", "lz4", or "parquet". If None, it will be automatically inferred from the filename extension.
    """
    # Infer file extension -------------------------------------------------
    kind = get_file_kind(path, kind)

    # Save Run -------------------------------------------------------------
    if not self.sorted:
        self.sort()

    if kind == "json":
        save_json(self.to_dict(), path)
    elif kind == "lz4":
        save_lz4(self.to_dict(), path)
    elif kind == "parquet":
        self.to_dataframe().to_parquet(path, index=False)
    else:
        with open(path, "w") as f:
            for i, q_id in enumerate(self.run.keys()):
                for rank, doc_id in enumerate(self.run[q_id].keys()):
                    score = self.run[q_id][doc_id]
                    f.write(f"{q_id} Q0 {doc_id} {rank+1} {score} {self.name}")

                    if (
                        i != len(self.run.keys()) - 1
                        or rank != len(self.run[q_id].keys()) - 1
                    ):
                        f.write("\n")

sort()

Sort. Used internally.

Source code in ranx/data_structures/run.py, lines 136-140
def sort(self):
    """Sort. Used internally."""
    self.run = sort_dict_by_key(self.run)
    self.run = sort_dict_of_dict_by_value(self.run)
    self.sorted = True

to_dataframe()

Convert Run to Pandas DataFrame with the following columns: q_id, doc_id, and score.

Returns:

pandas.DataFrame: Run as Pandas DataFrame.

Source code in ranx/data_structures/run.py, lines 175-189
def to_dataframe(self) -> pd.DataFrame:
    """Convert Run to Pandas DataFrame with the following columns: `q_id`, `doc_id`, and `score`.

    Returns:
        pandas.DataFrame: Run as Pandas DataFrame.
    """
    data = {"q_id": [], "doc_id": [], "score": []}

    for q_id in self.run:
        for doc_id in self.run[q_id]:
            data["q_id"].append(q_id)
            data["doc_id"].append(doc_id)
            data["score"].append(self.run[q_id][doc_id])

    return pd.DataFrame.from_dict(data)
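A minimal sketch of the long-format layout this produces, one row per query/document pair (the printed frame below is indicative only):

```python
from ranx import Run

run = Run({"q_1": {"d_1": 0.9, "d_2": 0.8}, "q_2": {"d_3": 0.7}})
df = run.to_dataframe()

print(df)
#   q_id doc_id  score
# 0  q_1    d_1    0.9
# 1  q_1    d_2    0.8
# 2  q_2    d_3    0.7
```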

to_dict()

Convert Run to Python dictionary.

Returns:

Dict[str, Dict[str, int]]: Run as Python dictionary.

Source code in ranx/data_structures/run.py, lines 164-173
def to_dict(self):
    """Convert Run to Python dictionary.

    Returns:
        Dict[str, Dict[str, int]]: Run as Python dictionary
    """
    d = defaultdict(dict)
    for q_id in self.keys():
        d[q_id] = dict(self[q_id])
    return d
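A round-trip sketch: dump a Run to a plain dictionary and rebuild an equivalent Run from it.

```python
from ranx import Run

run = Run({"q_1": {"d_1": 0.9, "d_2": 0.8}}, name="bm25")

d = run.to_dict()              # {"q_1": {"d_1": 0.9, "d_2": 0.8}}
clone = Run(d, name=run.name)  # rebuild an equivalent Run from the plain dictionary
```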

to_typed_list()

Convert Run to Numba Typed List. Used internally.

Source code in ranx/data_structures/run.py, lines 158-162
def to_typed_list(self):
    """Convert Run to Numba Typed List. Used internally."""
    if not self.sorted:
        self.sort()
    return to_typed_list(self.run)

evaluate(qrels, run, metrics, return_mean=True, return_std=False, threads=0, save_results_in_run=True, make_comparable=False)

Compute the performance scores for the provided qrels and run for all the specified metrics.

Usage examples:

from ranx import evaluate

Compute score for a single metric

evaluate(qrels, run, "ndcg@5")

0.7861

Compute scores for multiple metrics at once

evaluate(qrels, run, ["map@5", "mrr"])

{"map@5": 0.6416, "mrr": 0.75}

Computed metric scores are saved in the Run object

run.mean_scores

{"ndcg@5": 0.7861, "map@5": 0.6416, "mrr": 0.75}

Access scores for each query

dict(run.scores)

{ ... "ndcg@5": {"q_1": 0.9430, "q_2": 0.6292}, ... "map@5": {"q_1": 0.8333, "q_2": 0.4500}, ... "mrr": {"q_1": 1.0000, "q_2": 0.5000}, ... } Args: qrels (Union[ Qrels, Dict[str, Dict[str, Number]], nb.typed.typedlist.List, np.ndarray, ]): Qrels. run (Union[ Run, Dict[str, Dict[str, Number]], nb.typed.typedlist.List, np.ndarray, ]): Run. metrics (Union[List[str], str]): Metrics or list of metric to compute. return_mean (bool, optional): Whether to return the metric scores averaged over the query set or the scores for individual queries. Defaults to True. threads (int, optional): Number of threads to use, zero means all the available threads. Defaults to 0. save_results_in_run (bool, optional): Save metric scores for each query in the input run. Defaults to True. make_comparable (bool, optional): Adds empty results for queries missing from the run and removes those not appearing in qrels. Defaults to False.

Returns:

Union[Dict[str, float], float]: Results.

Source code in ranx/meta/evaluate.py, lines 65-169
def evaluate(
    qrels: Union[
        Qrels,
        Dict[str, Dict[str, Number]],
        nb.typed.typedlist.List,
        np.ndarray,
    ],
    run: Union[
        Run,
        Dict[str, Dict[str, Number]],
        nb.typed.typedlist.List,
        np.ndarray,
    ],
    metrics: Union[List[str], str],
    return_mean: bool = True,
    return_std: bool = False,
    threads: int = 0,
    save_results_in_run: bool = True,
    make_comparable: bool = False,
) -> Union[Dict[str, float], float]:
    """Compute the performance scores for the provided `qrels` and `run` for all the specified metrics.

    Usage examples:

    from ranx import evaluate

    # Compute score for a single metric
    evaluate(qrels, run, "ndcg@5")
    >>> 0.7861

    # Compute scores for multiple metrics at once
    evaluate(qrels, run, ["map@5", "mrr"])
    >>> {"map@5": 0.6416, "mrr": 0.75}

    # Computed metric scores are saved in the Run object
    run.mean_scores
    >>> {"ndcg@5": 0.7861, "map@5": 0.6416, "mrr": 0.75}

    # Access scores for each query
    dict(run.scores)
    >>> {
    ...     "ndcg@5": {"q_1": 0.9430, "q_2": 0.6292},
    ...     "map@5": {"q_1": 0.8333, "q_2": 0.4500},
    ...     "mrr": {"q_1": 1.0000, "q_2": 0.5000},
    ... }
    Args:
        qrels (Union[ Qrels, Dict[str, Dict[str, Number]], nb.typed.typedlist.List, np.ndarray, ]): Qrels.
        run (Union[ Run, Dict[str, Dict[str, Number]], nb.typed.typedlist.List, np.ndarray, ]): Run.
        metrics (Union[List[str], str]): Metric or list of metrics to compute.
        return_mean (bool, optional): Whether to return the metric scores averaged over the query set or the scores for individual queries. Defaults to True.
        return_std (bool, optional): Whether to also return the standard deviation of the scores across queries (only used when return_mean is True). Defaults to False.
        threads (int, optional): Number of threads to use, zero means all the available threads. Defaults to 0.
        save_results_in_run (bool, optional): Save metric scores for each query in the input `run`. Defaults to True.
        make_comparable (bool, optional): Adds empty results for queries missing from the run and removes those not appearing in qrels. Defaults to False.

    Returns:
        Union[Dict[str, float], float]: Results.
    """

    if len(qrels) < 10:
        set_num_threads(1)
    elif threads != 0:
        set_num_threads(threads)

    if not return_mean:
        return_std = False

    if make_comparable and type(qrels) == Qrels and type(run) == Run:
        run = run.make_comparable(qrels)

    if type(qrels) in [Qrels, dict] and type(run) in [Run, dict]:
        check_keys(qrels, run)

    _qrels = convert_qrels(qrels)
    _run = convert_run(run)
    metrics = format_metrics(metrics)
    assert all(isinstance(m, str) for m in metrics), "Metrics error"

    # Compute metrics ----------------------------------------------------------
    metric_scores_dict = {}
    for metric in metrics:
        m, k, rel_lvl = extract_metric_and_params(metric)
        metric_scores_dict[metric] = metric_switch(m)(_qrels, _run, k, rel_lvl)

    # Save results in Run ------------------------------------------------------
    if type(run) == Run and save_results_in_run:
        for m, scores in metric_scores_dict.items():
            run.mean_scores[m] = np.mean(scores)
            if return_std:
                run.std_scores[m] = np.std(scores)
            for i, q_id in enumerate(run.get_query_ids()):
                run.scores[m][q_id] = scores[i]

    # Prepare output -----------------------------------------------------------
    if return_mean:
        for m, scores in metric_scores_dict.items():
            if return_std:
                metric_scores_dict[m] = {
                    "mean": np.mean(scores),
                    "std": np.std(scores),
                }

            else:
                metric_scores_dict[m] = np.mean(scores)

    # Index by the metric name itself rather than the loop variable, which may not be set
    return metric_scores_dict[metrics[0]] if len(metrics) == 1 else metric_scores_dict
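Beyond the basic calls shown above, a short sketch of the alternative output shapes controlled by return_mean and return_std, on a toy qrels/run pair (values elided):

```python
from ranx import Qrels, Run, evaluate

qrels = Qrels({"q_1": {"d_1": 1}, "q_2": {"d_2": 1}})
run = Run({"q_1": {"d_1": 0.9, "d_3": 0.8}, "q_2": {"d_2": 0.7}})

# Per-query scores instead of the mean: one value per query, in query-id order
per_query = evaluate(qrels, run, "mrr", return_mean=False)

# Mean and standard deviation across queries for each metric:
# {"mrr": {"mean": ..., "std": ...}, "map": {"mean": ..., "std": ...}}
summary = evaluate(qrels, run, ["mrr", "map"], return_std=True)
```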

python_dict_to_typed_list(x, sort=True)

Converts a nested Python Dictionary to Numba Typed List to be used with ranx's metrics with no effort.

Note: Doc IDs will be hashed.

Source code in ranx/utils.py, lines 24-42
def python_dict_to_typed_list(x: Dict[str, Dict[str, Number]], sort: bool = True):
    """Converts a nested Python Dictionary to Numba Typed List to be used with ranx's metrics with no effort.

    Note: Doc IDs will be hashed.
    """
    out = TypedList(
        [
            np.array(
                [[hash(doc_id), score] for doc_id, score in doc.items()],
                dtype=np.float64,
            )
            for doc in x.values()
        ]
    )

    if sort:
        out = descending_sort_parallel(out)

    return out
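A minimal sketch of calling the converter directly, assuming it is importable from ranx.utils as the source location above indicates; note that document ids are replaced by their hashes in the output arrays:

```python
from ranx.utils import python_dict_to_typed_list

run_dict = {"q_1": {"d_1": 0.9, "d_2": 0.8}, "q_2": {"d_3": 0.7}}
typed = python_dict_to_typed_list(run_dict, sort=True)

# One float64 array per query with rows of [hash(doc_id), score],
# sorted by score in descending order when sort=True.
print(typed[0].shape)  # (2, 2)
```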