evaluation_factory

Evaluation factory module.

This module is responsible to provide an evaluation factory, which is responsible to create an evaluation object with the metrics of a search string generated by SeSG.

`Evaluation` `dataclass`

Evaluation of a search string.

Parameters:

Name	Type	Description	Default
`n_scopus_results`	`int`	Number of results returned by Scopus.	required
`gs_size`	`int`	Size of the gold standard.	required
`qgs_in_scopus`	`list[Study]`	QGS studies that were found in Scopus.	`field(default_factory=list)`
`gs_in_scopus`	`list[Study]`	GS studies that were found in Scopus.	`field(default_factory=list)`
`gs_in_bsb`	`list[Study]`	GS studies that were found via backward snowballing.	`field(default_factory=list)`
`gs_in_sb`	`list[Study]`	GS studies that were found via backward and forward snowballing.	`field(default_factory=list)`

Source code in src/sesg/evaluation/evaluation_factory.py

@dataclass(frozen=True)
class Evaluation:
    """Evaluation of a search string.

    Args:
        n_scopus_results (int): Number of results returned by Scopus.
        gs_size (int): Size of the gold standard.
        qgs_in_scopus (list[Study]): QGS studies that were found in Scopus.
        gs_in_scopus (list[Study]): GS studies that were found in Scopus.
        gs_in_bsb (list[Study]): GS studies that were found via backward snowballing.
        gs_in_sb (list[Study]): GS studies that were found via backward and forward snowballing.
    """  # noqa: E501

    n_scopus_results: int
    gs_size: int

    qgs_in_scopus: list[Study] = field(default_factory=list)
    gs_in_scopus: list[Study] = field(default_factory=list)
    gs_in_bsb: list[Study] = field(default_factory=list)
    gs_in_sb: list[Study] = field(default_factory=list)

    @cached_property
    def start_set_precision(self) -> float:
        """Start set precision.

        Ratio between the number of GS studies found in Scopus and the number of Scopus results.

        If the number of Scopus results is 0, then the precision is 0.
        """  # noqa: E501
        if self.n_scopus_results == 0:
            return 0

        return len(self.gs_in_scopus) / self.n_scopus_results

    @cached_property
    def start_set_recall(self) -> float:
        """Start set recall.

        Ratio between the number of GS studies found in Scopus and the size of the GS.
        """
        return len(self.gs_in_scopus) / self.gs_size

    @cached_property
    def start_set_f1_score(self) -> float:
        """Start set F1 score.

        A balanced metric between precision and recall.

        If both the start set precision and recall are 0, then the F1 score is 0.
        """
        precision = self.start_set_precision
        recall = self.start_set_recall

        numerator = 2 * precision * recall
        denominator = precision + recall

        if denominator == 0:
            return 0

        return numerator / denominator

    @cached_property
    def bsb_recall(self) -> float:
        """Recall considering backward snowballing.

        Ratio between the number of GS studies found in backward snowballing and the size of the GS.
        """  # noqa: E501
        return len(self.gs_in_bsb) / self.gs_size

    @cached_property
    def sb_recall(self) -> float:
        """Recall considering backward and forward snowballing.

        Ratio between the number of GS studies found in backward and forward snowballing and the size of the GS.
        """  # noqa: E501
        return len(self.gs_in_sb) / self.gs_size

`bsb_recall: float` `property` `cached`

Recall considering backward snowballing.

Ratio between the number of GS studies found in backward snowballing and the size of the GS.

`sb_recall: float` `property` `cached`

Recall considering backward and forward snowballing.

Ratio between the number of GS studies found in backward and forward snowballing and the size of the GS.

`start_set_f1_score: float` `property` `cached`

Start set F1 score.

A balanced metric between precision and recall.

If both the start set precision and recall are 0, then the F1 score is 0.

`start_set_precision: float` `property` `cached`

Start set precision.

Ratio between the number of GS studies found in Scopus and the number of Scopus results.

If the number of Scopus results is 0, then the precision is 0.

`start_set_recall: float` `property` `cached`

Start set recall.

Ratio between the number of GS studies found in Scopus and the size of the GS.

`EvaluationFactory` `dataclass`

Evaluation factory.

To evaluate a search string, use the evaluate method.

Parameters:

Name	Type	Description	Default
`gs`	`list[Study]`	Gold standard.	required
`qgs`	`list[Study]`	Quasi gold standard.	required

Source code in src/sesg/evaluation/evaluation_factory.py

@dataclass(frozen=True)
class EvaluationFactory:
    """Evaluation factory.

    To evaluate a search string, use the [`evaluate`][sesg.evaluation.evaluation_factory.EvaluationFactory.evaluate] method.

    Args:
        gs (list[Study]): Gold standard.
        qgs (list[Study]): Quasi gold standard.
    """  # noqa: E501

    gs: list[Study]
    qgs: list[Study]

    @cached_property
    def processed_gs_titles(self) -> list[str]:
        """Preprocessed GS titles."""
        return [s.processed_title for s in self.gs]

    @cached_property
    def processed_qgs_titles(self) -> list[str]:
        """Preprocessed QGS titles."""
        return [s.processed_title for s in self.qgs]

    @cached_property
    def studies_dict(self) -> dict[int, Study]:
        """Dictionary mapping a study ID to a study."""
        return {s.id: s for s in self.gs}

    def _get_study_by_id(self, id: int) -> Study:
        return self.studies_dict[id]

    @cached_property
    def directed_adjacency_list(self) -> dict[int, list[int]]:
        """Directed adjacency list of the GS."""
        return get_directed_adjacency_list_from_gs(self.gs)

    @cached_property
    def undirected_adjacency_list(self) -> dict[int, list[int]]:
        """Undirected adjacency list of the GS."""
        return directed_adjacency_list_to_undirected(self.directed_adjacency_list)

    def get_qgs_in_scopus(
        self,
        processed_scopus_titles: list[str],
    ) -> list[Study]:
        """Get QGS studies that were found in Scopus."""
        qgs_in_scopus = similarity_score(
            small_set=self.processed_qgs_titles,
            other_set=processed_scopus_titles,
        )

        return [self.qgs[id] for id, _ in qgs_in_scopus]

    def get_gs_in_scopus(
        self,
        processed_scopus_titles: list[str],
    ) -> list[Study]:
        """Get GS studies that were found in Scopus."""
        gs_in_scopus = similarity_score(
            small_set=self.processed_gs_titles,
            other_set=processed_scopus_titles,
        )

        return [self.gs[id] for id, _ in gs_in_scopus]

    def get_gs_in_bsb(
        self,
        gs_in_scopus: list[Study],
    ) -> list[Study]:
        """Get GS studies that were found via backward snowballing."""
        gs_in_bsb = snowballing(
            adjacency_list=self.directed_adjacency_list,
            start_set=[s.id for s in gs_in_scopus],
        )

        return [self._get_study_by_id(id) for id in gs_in_bsb]

    def get_gs_in_sb(
        self,
        gs_in_scopus: list[Study],
    ) -> list[Study]:
        """Get GS studies that were found via backward or forward snowballing."""
        gs_in_bsb = snowballing(
            adjacency_list=self.undirected_adjacency_list,
            start_set=[s.id for s in gs_in_scopus],
        )

        return [self._get_study_by_id(id) for id in gs_in_bsb]

    def evaluate(
        self,
        scopus_results: list[str],
    ) -> Evaluation:
        """Evaluate the performance of a search string using the results returned by Scopus.

        Args:
            scopus_results (list[str]): List with the titles of the studies returned by Scopus.

        Returns:
            An object with the evaluation metrics.
        """  # noqa: E501
        processed_scopus_titles = [process_title(title) for title in scopus_results]

        qgs_in_scopus = self.get_qgs_in_scopus(processed_scopus_titles)
        gs_in_scopus = self.get_gs_in_scopus(processed_scopus_titles)
        gs_in_bsb = self.get_gs_in_bsb(gs_in_scopus)
        gs_in_sb = self.get_gs_in_sb(gs_in_scopus)

        return Evaluation(
            qgs_in_scopus=qgs_in_scopus,
            gs_in_scopus=gs_in_scopus,
            gs_in_bsb=gs_in_bsb,
            gs_in_sb=gs_in_sb,
            gs_size=len(self.gs),
            n_scopus_results=len(scopus_results),
        )

`directed_adjacency_list: dict[int, list[int]]` `property` `cached`

Directed adjacency list of the GS.

`processed_gs_titles: list[str]` `property` `cached`

Preprocessed GS titles.

`processed_qgs_titles: list[str]` `property` `cached`

Preprocessed QGS titles.

`studies_dict: dict[int, Study]` `property` `cached`

Dictionary mapping a study ID to a study.

`undirected_adjacency_list: dict[int, list[int]]` `property` `cached`

Undirected adjacency list of the GS.

`evaluate(scopus_results)`

Evaluate the performance of a search string using the results returned by Scopus.

Parameters:

Name	Type	Description	Default
`scopus_results`	`list[str]`	List with the titles of the studies returned by Scopus.	required

Returns:

Type	Description
`Evaluation`	An object with the evaluation metrics.

Source code in src/sesg/evaluation/evaluation_factory.py

def evaluate(
    self,
    scopus_results: list[str],
) -> Evaluation:
    """Evaluate the performance of a search string using the results returned by Scopus.

    Args:
        scopus_results (list[str]): List with the titles of the studies returned by Scopus.

    Returns:
        An object with the evaluation metrics.
    """  # noqa: E501
    processed_scopus_titles = [process_title(title) for title in scopus_results]

    qgs_in_scopus = self.get_qgs_in_scopus(processed_scopus_titles)
    gs_in_scopus = self.get_gs_in_scopus(processed_scopus_titles)
    gs_in_bsb = self.get_gs_in_bsb(gs_in_scopus)
    gs_in_sb = self.get_gs_in_sb(gs_in_scopus)

    return Evaluation(
        qgs_in_scopus=qgs_in_scopus,
        gs_in_scopus=gs_in_scopus,
        gs_in_bsb=gs_in_bsb,
        gs_in_sb=gs_in_sb,
        gs_size=len(self.gs),
        n_scopus_results=len(scopus_results),
    )

`get_gs_in_bsb(gs_in_scopus)`

Get GS studies that were found via backward snowballing.

Source code in src/sesg/evaluation/evaluation_factory.py

def get_gs_in_bsb(
    self,
    gs_in_scopus: list[Study],
) -> list[Study]:
    """Get GS studies that were found via backward snowballing."""
    gs_in_bsb = snowballing(
        adjacency_list=self.directed_adjacency_list,
        start_set=[s.id for s in gs_in_scopus],
    )

    return [self._get_study_by_id(id) for id in gs_in_bsb]

`get_gs_in_sb(gs_in_scopus)`

Get GS studies that were found via backward or forward snowballing.

Source code in src/sesg/evaluation/evaluation_factory.py

def get_gs_in_sb(
    self,
    gs_in_scopus: list[Study],
) -> list[Study]:
    """Get GS studies that were found via backward or forward snowballing."""
    gs_in_bsb = snowballing(
        adjacency_list=self.undirected_adjacency_list,
        start_set=[s.id for s in gs_in_scopus],
    )

    return [self._get_study_by_id(id) for id in gs_in_bsb]

`get_gs_in_scopus(processed_scopus_titles)`

Get GS studies that were found in Scopus.

Source code in src/sesg/evaluation/evaluation_factory.py

def get_gs_in_scopus(
    self,
    processed_scopus_titles: list[str],
) -> list[Study]:
    """Get GS studies that were found in Scopus."""
    gs_in_scopus = similarity_score(
        small_set=self.processed_gs_titles,
        other_set=processed_scopus_titles,
    )

    return [self.gs[id] for id, _ in gs_in_scopus]

`get_qgs_in_scopus(processed_scopus_titles)`

Get QGS studies that were found in Scopus.

Source code in src/sesg/evaluation/evaluation_factory.py

def get_qgs_in_scopus(
    self,
    processed_scopus_titles: list[str],
) -> list[Study]:
    """Get QGS studies that were found in Scopus."""
    qgs_in_scopus = similarity_score(
        small_set=self.processed_qgs_titles,
        other_set=processed_scopus_titles,
    )

    return [self.qgs[id] for id, _ in qgs_in_scopus]

`Study` `dataclass`

Represents a study.

Parameters:

Name	Type	Description	Default
`id`	`int`	Study's ID.	required
`title`	`str`	Study's title.	required
`references`	`list[Study]`	Study's references. If None, defaults to an empty list.	`field(default_factory=list)`

Source code in src/sesg/evaluation/evaluation_factory.py

@dataclass(unsafe_hash=True)
class Study:
    """Represents a study.

    Args:
        id (int): Study's ID.
        title (str): Study's title.
        references (list[Study]): Study's references. If None, defaults to an empty list.
    """  # noqa: E501

    id: int
    title: str

    references: list["Study"] = field(default_factory=list)

    @cached_property
    def processed_title(self):
        """Preprocessed title."""
        return process_title(self.title)

`processed_title` `property` `cached`

Preprocessed title.

`get_directed_adjacency_list_from_gs(gs)`

Creates a directed adjacency list from a gold standard set of studies.

Parameters:

Name	Type	Description	Default
`gs`	`list[Study]`	Set of studies that compose the GS.	required

Returns:

Type	Description
`dict[int, list[int]]`	A dictionary mapping a study ID to it's references.

Source code in src/sesg/evaluation/evaluation_factory.py

def get_directed_adjacency_list_from_gs(
    gs: list["Study"],
) -> dict[int, list[int]]:
    """Creates a directed adjacency list from a gold standard set of studies.

    Args:
        gs (list[Study]): Set of studies that compose the GS.

    Returns:
        A dictionary mapping a study ID to it's references.
    """
    adjacency_list = {}

    for study in gs:
        adjacency_list[study.id] = [ref.id for ref in study.references]

    return adjacency_list

`process_title(string)`

Strips the string and turn every character to lower case.

Parameters:

Name	Type	Description	Default
`string`	`str`	The string to preprocess.	required

Returns:

Type	Description
`str`	The preprocessed string.

Examples:

>>> process_title(" A string Here.  \n")
'a string here.'

Source code in src/sesg/evaluation/evaluation_factory.py

def process_title(
    string: str,
) -> str:
    r"""Strips the string and turn every character to lower case.

    Args:
        string: The string to preprocess.

    Returns:
        The preprocessed string.

    Examples:
        >>> process_title(" A string Here.  \n")
        'a string here.'
    """
    return string.strip().lower()

`similarity_score(small_set, other_set)`

Uses TfidfVectorizer, cosine_similarity, and Levenshtein to calculate the intersection of two sets of strings.

You might need to preprocess the strings with process_title.

Parameters:

Name	Type	Description	Default
`small_set`	`list[str]`	Set of strings. If possible, the length of this set should be smaller than the other one.	required
`other_set`	`list[str]`	Set of strings to compare against.	required

Returns:

Type	Description
`list[tuple[int, int]]`	List of tuples, where the tuple `(i, j)` means that `small_set[i]` is similar to `other_set[j]`.

Examples:

>>> small_set = ["machine learning", "databases", "search strings"]
>>> other_set = ["Databases, an introduction", "Machine Learning", "Search String"]
>>> similarity_score(
...     small_set=small_set,
...     other_set=other_set
... )
[(0, 1), (2, 2)]

Source code in src/sesg/evaluation/evaluation_factory.py

def similarity_score(
    small_set: list[str],
    other_set: list[str],
) -> list[tuple[int, int]]:
    """Uses `TfidfVectorizer`, `cosine_similarity`, and `Levenshtein` to calculate the intersection of two sets of strings.

    You might need to preprocess the strings with [`process_title`][sesg.evaluation.evaluation_factory.process_title].

    Args:
        small_set (list[str]): Set of strings. If possible, the length of this set should be smaller than the other one.
        other_set (list[str]): Set of strings to compare against.

    Returns:
        List of tuples, where the tuple `(i, j)` means that `small_set[i]` is similar to `other_set[j]`.

    Examples:
        >>> small_set = ["machine learning", "databases", "search strings"]
        >>> other_set = ["Databases, an introduction", "Machine Learning", "Search String"]
        >>> similarity_score(
        ...     small_set=small_set,
        ...     other_set=other_set
        ... )
        [(0, 1), (2, 2)]
    """  # noqa: E501
    if len(other_set) == 0:
        return []

    train_set = [*small_set, *other_set]

    tfidf_vectorizer = TfidfVectorizer()
    tfidf_matrix = tfidf_vectorizer.fit_transform(train_set)

    first_set_matrix = tfidf_matrix[0 : len(small_set)]
    second_set_matrix = tfidf_matrix[len(small_set) : len(small_set) + len(other_set)]

    similarity_matrix = cosine_similarity(
        first_set_matrix,
        second_set_matrix,
    )

    lines: int
    lines, _ = similarity_matrix.shape

    similars: list[tuple[int, int]] = []

    for index_of_first_set_element in range(lines):
        # contains the row of the similarity matrix for the current element
        line = similarity_matrix[index_of_first_set_element]

        index_of_closest_element_in_second_set: int = argsort(line)[-1]

        first_set_element = small_set[index_of_first_set_element]
        second_set_element = other_set[index_of_closest_element_in_second_set]

        distance = Levenshtein.distance(
            first_set_element,
            second_set_element,
            score_cutoff=10,
        )

        if distance < 10:
            similars.append(
                (index_of_first_set_element, index_of_closest_element_in_second_set)
            )

    return similars

evaluation_factory

Evaluation dataclass

bsb_recall: float property cached

sb_recall: float property cached

start_set_f1_score: float property cached

start_set_precision: float property cached

start_set_recall: float property cached

EvaluationFactory dataclass

directed_adjacency_list: dict[int, list[int]] property cached

processed_gs_titles: list[str] property cached

processed_qgs_titles: list[str] property cached

studies_dict: dict[int, Study] property cached

undirected_adjacency_list: dict[int, list[int]] property cached

evaluate(scopus_results)

get_gs_in_bsb(gs_in_scopus)

get_gs_in_sb(gs_in_scopus)

get_gs_in_scopus(processed_scopus_titles)

get_qgs_in_scopus(processed_scopus_titles)

Study dataclass

processed_title property cached

get_directed_adjacency_list_from_gs(gs)

process_title(string)

similarity_score(small_set, other_set)

`Evaluation` `dataclass`

`bsb_recall: float` `property` `cached`

`sb_recall: float` `property` `cached`

`start_set_f1_score: float` `property` `cached`

`start_set_precision: float` `property` `cached`

`start_set_recall: float` `property` `cached`

`EvaluationFactory` `dataclass`

`directed_adjacency_list: dict[int, list[int]]` `property` `cached`

`processed_gs_titles: list[str]` `property` `cached`

`processed_qgs_titles: list[str]` `property` `cached`

`studies_dict: dict[int, Study]` `property` `cached`

`undirected_adjacency_list: dict[int, list[int]]` `property` `cached`

`evaluate(scopus_results)`

`get_gs_in_bsb(gs_in_scopus)`

`get_gs_in_sb(gs_in_scopus)`

`get_gs_in_scopus(processed_scopus_titles)`

`get_qgs_in_scopus(processed_scopus_titles)`

`Study` `dataclass`

`processed_title` `property` `cached`

`get_directed_adjacency_list_from_gs(gs)`

`process_title(string)`

`similarity_score(small_set, other_set)`