Suggestion for Wandb

Hello, 
I find that the Wandb server is pretty unstable right now, so I suggest SwanLab as a good substitute for Wandb (especially for users in China). I installed the library and modified some content in wandb_recorder.py as follows:
```
from collections.abc import Mapping
from typing import Any

import jax.tree_util as jtu
import numpy as np
import pandas as pd
import wandb
# -----Here-----
import swanlab 
# -----Here-----

from .recorder import Recorder


class WandbRecorder(Recorder):
    """Recorder for Weights & Biases that also mirrors every record to SwanLab.

    The keyword arguments collected by the constructor are forwarded unchanged
    to both ``wandb.init`` and ``swanlab.init`` when `init` is called.
    """

    def __init__(self, *, project, name, config, tags, path, **wandb_kwargs):
        """Store the run settings; no run is started until `init` is called.

        Args:
            project: Stored under the ``"project"`` key.
            name: Stored under the ``"name"`` key.
            config: Stored under the ``"config"`` key.
            tags: Stored under the ``"tags"`` key.
            path: Stored under the ``"dir"`` key.
            **wandb_kwargs: Extra init options. They are merged last, so they
                override the entries above on a key collision.
        """
        self.wandb_kwargs = {
            "project": project,
            "name": name,
            "config": config,
            "tags": tags,
            "dir": path,
            **wandb_kwargs,
        }

    def init(self) -> None:
        """Start the wandb run, then the SwanLab run, with the stored kwargs."""
        wandb.init(**self.wandb_kwargs)
        # -----Here-----
        # NOTE(review): the wandb-style kwargs (including "dir") are passed to
        # swanlab.init as-is -- confirm SwanLab accepts every one of them.
        swanlab.init(**self.wandb_kwargs)
        # NOTE(review): confirm this call is still needed given that `write`
        # already calls swanlab.log explicitly, and whether it has to run
        # before wandb.init() to take effect.
        swanlab.sync_wandb()
        # -----Here-----

    def write(self, data: Mapping[str, Any], step: int | None = None) -> None:
        """Convert pandas leaves in `data` and log the result to both backends.

        Args:
            data: Mapping (possibly nested) of values to log. Every leaf is
                passed through `_convert_data` before logging.
            step: Step forwarded to both ``wandb.log`` and ``swanlab.log``.
        """
        data = jtu.tree_map(_convert_data, data)
        wandb.log(data, step=step)
        # NOTE(review): leaves converted to wandb.Histogram / wandb.Table are
        # passed to swanlab.log too -- confirm SwanLab can handle them.
        swanlab.log(data, step=step)

    def close(self):
        """Finish the wandb run and the SwanLab run."""
        try:
            wandb.finish()
        finally:
            # -----Here-----
            # Always finish the SwanLab run, even if wandb.finish() raised,
            # so that a wandb failure does not leave the SwanLab run open.
            swanlab.finish()
            # -----Here-----


def _convert_data(val: Any):
    """Wrap pandas objects in their wandb counterpart; pass anything else through.

    A `pd.DataFrame` becomes a `wandb.Table`, a `pd.Series` becomes a
    `wandb.Histogram`, and every other value is returned unchanged.
    """
    if isinstance(val, pd.DataFrame):
        return wandb.Table(dataframe=val)
    if isinstance(val, pd.Series):
        return wandb.Histogram(val)
    return val


def add_prefix(data: dict, prefix: str):
    """Return a new dict whose keys are rewritten as ``"<prefix>/<key>"``.

    Values are kept as-is and the input dictionary is not modified.
    """
    prefixed = {}
    for key, value in data.items():
        prefixed[f"{prefix}/{key}"] = value
    return prefixed


def get_1d_array_statistics(data, histogram=False):
    """Get raw value and statistics of a 1D array.

    Helper function for logging in WandB.

    Args:
        data: 1D numpy array, or None. If data has multiple dimensions, it will be viewed as flattened.
        histogram: If True, return raw data in `pd.Series`, which will be further converted to histogram in `WandbRecorder`.

    Returns:
        A dictionary containing min, max, mean (computed with the NaN-ignoring
        numpy reductions), and, when `histogram` is True, the raw data under
        the ``"val"`` key. When data is None, the statistics are all None and
        ``"val"`` (if requested) is an empty `pd.Series`.
    """
    if data is None:
        res = dict(min=None, max=None, mean=None)
        if histogram:
            res["val"] = pd.Series()
        return res

    res = dict(
        min=np.nanmin(data).tolist(),
        max=np.nanmax(data).tolist(),
        mean=np.nanmean(data).tolist(),
    )

    if histogram:
        # pd.Series rejects multi-dimensional input, so flatten first to
        # honor the documented handling of data with multiple dimensions.
        res["val"] = pd.Series(np.ravel(data))

    return res


def get_1d_array(data):
    """Get min, max, mean and the raw values of a 1D array.

    Counterpart of `get_1d_array_statistics` that stores the data itself under
    ``"val"`` rather than a `pd.Series`, so WandB records the raw data instead
    of a histogram. When data is None, the statistics are None and ``"val"``
    is an empty list.
    """
    if data is not None:
        return {
            "min": np.nanmin(data).tolist(),
            "max": np.nanmax(data).tolist(),
            "mean": np.nanmean(data).tolist(),
            "val": data,
        }

    return {"min": None, "max": None, "mean": None, "val": []}

```

This small change would make it easier for users to log their training records.




Provide feedback

Saved searches

Use saved searches to filter your results more quickly

Suggestion for Wandb #13

Metadata

Assignees

Labels

Type

Projects

Milestone

Relationships

Development

Suggestion for Wandb #13

Description

Metadata

Metadata

Assignees

Labels

Type

Projects

Milestone

Relationships

Development

Issue actions