Skip to content

Conflicts

Functions to resolve any git conflicts between notebooks.

DiffJupyterNotebook (DiffModel)

Protocol for mypy static type checking.

cells_equals(diff_cells)

Return if cells in DiffCells are equal.

Source code in databooks/conflicts.py
def cells_equals(diff_cells: Cells[Tuple[List[Cell], List[Cell]]]) -> List[bool]:
    """Return if cells in `DiffCells` are equal."""
    return [cell_first == cell_last for cell_first, cell_last in diff_cells]

conflict2nb(conflict_file, *, keep_first=True, cells_first=None, ignore_none=True, verbose=False)

Merge diffs from conflicts and return valid a notebook.

Parameters:

Name Type Description Default
conflict_file ConflictFile

A databooks.git_utils.ConflictFile with conflicts

required
keep_first bool

Whether to keep the metadata of the first or last notebook

True
cells_first Optional[bool]

Whether to keep the cells of the first or last notebook

None
ignore_none bool

Keep all metadata fields even if it's included in only one notebook

True
verbose bool

Log written files and metadata conflicts

False

Returns:

Type Description
JupyterNotebook

Resolved conflicts as a databooks.data_models.notebook.JupyterNotebook model

Source code in databooks/conflicts.py
def conflict2nb(
    conflict_file: ConflictFile,
    *,
    keep_first: bool = True,
    cells_first: Optional[bool] = None,
    ignore_none: bool = True,
    verbose: bool = False,
) -> JupyterNotebook:
    """
    Merge diffs from conflicts and return valid a notebook.

    :param conflict_file: A `databooks.git_utils.ConflictFile` with conflicts
    :param keep_first: Whether to keep the metadata of the first or last notebook
    :param cells_first: Whether to keep the cells of the first or last notebook
    :param ignore_none: Keep all metadata fields even if it's included in only one
     notebook
    :param verbose: Log written files and metadata conflicts
    :return: Resolved conflicts as a `databooks.data_models.notebook.JupyterNotebook`
     model
    """
    if verbose:
        set_verbose(logger)

    nb_1 = JupyterNotebook.parse_raw(conflict_file.first_contents)
    nb_2 = JupyterNotebook.parse_raw(conflict_file.last_contents)
    if nb_1.metadata != nb_2.metadata:
        msg = (
            f"Notebook metadata conflict for {conflict_file.filename}. Keeping "
            + "first."
            if keep_first
            else "last."
        )
        logger.debug(msg)

    diff_nb = cast(DiffModel, nb_1 - nb_2)
    nb = cast(
        JupyterNotebook,
        diff_nb.resolve(
            ignore_none=ignore_none,
            keep_first=keep_first,
            keep_first_cells=cells_first,
            first_id=conflict_file.first_log,
            last_id=conflict_file.last_log,
        ),
    )
    logger.debug(f"Resolved conflicts in {conflict_file.filename}.")
    return nb

conflicts2nbs(conflict_files, *, progress_callback=<function <lambda> at 0x7fb7573e0dc0>, **conflict2nb_kwargs)

Get notebooks from conflicts.

Wrap databooks.conflicts.conflict2nb to write notebooks to list of databooks.git_utils.ConflictFile.

Parameters:

Name Type Description Default
conflict_files List[ConflictFile]

Files with source conflict files and one-liner git logs

required
progress_callback Callable[[], None]

Callback function to report progress

<function <lambda> at 0x7fb7573e0dc0>
conflict2nb_kwargs Any

Keyword arguments to be passed to databooks.conflicts.conflict2nb

{}

Returns:

Type Description
None
Source code in databooks/conflicts.py
def conflicts2nbs(
    conflict_files: List[ConflictFile],
    *,
    progress_callback: Callable[[], None] = lambda: None,
    **conflict2nb_kwargs: Any,
) -> None:
    """
    Get notebooks from conflicts.

    Wrap `databooks.conflicts.conflict2nb` to write notebooks to list of
     `databooks.git_utils.ConflictFile`.
    :param conflict_files: Files with source conflict files and one-liner git logs
    :param progress_callback: Callback function to report progress
    :param conflict2nb_kwargs: Keyword arguments to be passed to
     `databooks.conflicts.conflict2nb`
    :return:
    """
    for conflict in conflict_files:
        nb = conflict2nb(conflict, **conflict2nb_kwargs)
        write_notebook(nb=nb, path=conflict.filename)
        progress_callback()

path2conflicts(nb_paths, repo=None)

Get the difference model from the path based on the git conflict information.

Parameters:

Name Type Description Default
nb_path

Path to file with conflicts (must be notebook paths)

required

Returns:

Type Description
List[ConflictFile]

Generator of DiffModels, to be resolved

Source code in databooks/conflicts.py
def path2conflicts(
    nb_paths: List[Path], repo: Optional[Repo] = None
) -> List[ConflictFile]:
    """
    Get the difference model from the path based on the git conflict information.

    :param nb_path: Path to file with conflicts (must be notebook paths)
    :return: Generator of `DiffModel`s, to be resolved
    """
    if any(nb_path.suffix not in ("", ".ipynb") for nb_path in nb_paths):
        raise ValueError(
            "Expected either notebook files, a directory or glob expression."
        )
    common_parent = max(set.intersection(*[set(p.parents) for p in nb_paths]))
    repo = get_repo(common_parent) if repo is None else repo
    return [
        file
        for file in get_conflict_blobs(repo=repo)
        if any(file.filename.match(str(p.name)) for p in nb_paths)
    ]
Back to top