
feat(zero_order): implemented the zero order feature #93

Merged: 14 commits, Oct 11, 2022
.pylintrc (1 addition, 1 deletion)
@@ -444,7 +444,7 @@ indent-after-paren=4
indent-string=' '

# Maximum number of characters on a single line.
max-line-length=100
max-line-length=120

# Maximum number of lines in a module.
max-module-lines=1000
CHANGELOG.md (1 addition, 0 deletions)
@@ -13,6 +13,7 @@ and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0

### Added

- Add zero-order gradient estimation by [@JieRen98](https://github.com/JieRen98) in [#93](https://github.com/metaopt/torchopt/pull/93).
- Add RPC-based distributed training support and add distributed MAML example by [@XuehaiPan](https://github.com/XuehaiPan) in [#83](https://github.com/metaopt/torchopt/pull/83).
- Add full type hints by [@XuehaiPan](https://github.com/XuehaiPan) in [#92](https://github.com/metaopt/torchopt/pull/92).
- Add API documentation and tutorial for implicit gradients by [@Benjamin-eecs](https://github.com/Benjamin-eecs) and [@JieRen98](https://github.com/JieRen98) and [@XuehaiPan](https://github.com/XuehaiPan) in [#73](https://github.com/metaopt/torchopt/pull/73).
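The changelog entry above is the headline change in this PR: zero-order (gradient-free) gradient estimation. The diff shown here only touches the changelog, so as a rough, generic illustration of the idea rather than the torchopt API, the sketch below estimates a gradient purely from function evaluations using antithetic Gaussian perturbations; the function name, `sigma`, and `num_samples` are illustrative assumptions.

```python
import torch


def zero_order_grad(f, theta, sigma=0.01, num_samples=16):
    """Estimate d f(theta) / d theta using only evaluations of f.

    Two-sided (antithetic) Gaussian smoothing estimator:
        grad ~= E_u[(f(theta + sigma * u) - f(theta - sigma * u)) / (2 * sigma) * u]
    Generic sketch of zero-order estimation, not the torchopt implementation.
    """
    grad = torch.zeros_like(theta)
    for _ in range(num_samples):
        u = torch.randn_like(theta)                     # random perturbation direction
        f_plus = f(theta + sigma * u)                   # evaluation on one side
        f_minus = f(theta - sigma * u)                  # evaluation on the other side
        grad += (f_plus - f_minus) / (2.0 * sigma) * u  # directional finite difference
    return grad / num_samples


# Usage: for a smooth objective the estimate approximates the analytic gradient.
theta = torch.randn(4)
estimate = zero_order_grad(lambda x: (x ** 2).sum(), theta)
print(estimate)  # ~= 2 * theta, up to Monte-Carlo noise
```

This kind of estimator lets an outer loop "differentiate" through objectives where backpropagation is unavailable or too expensive, which is presumably the use case the new `zero_order_diff` module targets.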
pyproject.toml (1 addition, 0 deletions)
@@ -174,6 +174,7 @@ target-version = ["py37", "py38", "py39", "py310"]
atomic = true
profile = "black"
src_paths = ["torchopt", "examples", "tests"]
extra_standard_library = ["typing_extensions"]
indent = 4
line_length = 100
lines_after_imports = 2
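The new `extra_standard_library` entry tells isort to sort `typing_extensions` together with the standard library, which keeps the import block in `torchopt/base.py` (changed further down) in one stable group. A small illustration of the grouping this configuration produces, using the imports visible in this diff:

```python
# isort with extra_standard_library = ["typing_extensions"] places the
# typing_extensions import in the standard-library section:
import itertools
from abc import abstractmethod
from typing import TYPE_CHECKING, Callable, NamedTuple, Optional, Tuple
from typing_extensions import Protocol  # grouped with the stdlib, not third-party

import torch  # third-party imports keep their own section below
```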
torchopt/__init__.py (1 addition, 0 deletions)
@@ -26,6 +26,7 @@
schedule,
typing,
visual,
zero_order_diff,
)
from torchopt.accelerated_op import is_available as accelerated_op_available
from torchopt.alias import adam, adamw, rmsprop, sgd
torchopt/accelerated_op/adam_op.py (0 additions, 3 deletions)
@@ -31,7 +31,6 @@ class MuOp(torch.autograd.Function): # pylint: disable=abstract-method

@staticmethod
def jvp(ctx: Any, *grad_inputs: Any) -> Any:
# pylint: disable-next=line-too-long
"""Defines a formula for differentiating the operation with forward mode automatic differentiation."""

@staticmethod
@@ -58,7 +57,6 @@ class NuOp(torch.autograd.Function): # pylint: disable=abstract-method

@staticmethod
def jvp(ctx: Any, *grad_inputs: Any) -> Any:
# pylint: disable-next=line-too-long
"""Defines a formula for differentiating the operation with forward mode automatic differentiation."""

@staticmethod
@@ -85,7 +83,6 @@ class UpdatesOp(torch.autograd.Function): # pylint: disable=abstract-method

@staticmethod
def jvp(ctx: Any, *grad_inputs: Any) -> Any:
# pylint: disable-next=line-too-long
"""Defines a formula for differentiating the operation with forward mode automatic differentiation."""

@staticmethod
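The deleted pragmas sit above `jvp` docstrings of custom `torch.autograd.Function` subclasses (presumably no longer needed because the line-length limit was raised to 120 in this PR). For context, here is a minimal, generic sketch of such a Function with hand-written reverse-mode (`backward`) and forward-mode (`jvp`) rules; it is not the actual Adam kernel behind `MuOp`/`NuOp`/`UpdatesOp`.

```python
import torch


class Scale(torch.autograd.Function):  # pylint: disable=abstract-method
    """y = alpha * x, with explicit reverse-mode and forward-mode rules."""

    ALPHA = 3.0

    @staticmethod
    def forward(ctx, x):
        return Scale.ALPHA * x

    @staticmethod
    def backward(ctx, grad_output):
        """Reverse mode (vjp): dL/dx = alpha * dL/dy."""
        return Scale.ALPHA * grad_output

    @staticmethod
    def jvp(ctx, x_tangent):
        """Forward mode: the output tangent is alpha times the input tangent."""
        return Scale.ALPHA * x_tangent


# Forward-mode usage: push a tangent through the custom op with dual tensors.
x = torch.randn(3)
with torch.autograd.forward_ad.dual_level():
    dual_x = torch.autograd.forward_ad.make_dual(x, torch.ones_like(x))
    y = Scale.apply(dual_x)
    print(torch.autograd.forward_ad.unpack_dual(y).tangent)  # == 3.0 * ones(3)
```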
torchopt/alias.py (1 addition, 1 deletion)
@@ -130,7 +130,7 @@ def _scale_by_neg_lr(lr: ScalarOrSchedule):
if callable(lr):

def schedule_wrapper(count):
return -lr(count)
return -lr(count) # type: ignore[operator]

# pylint: disable-next=protected-access
return transform._scale_by_schedule(schedule_wrapper, already_flattened=True)
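The `type: ignore[operator]` is needed because `lr` is a `ScalarOrSchedule`: either a number or a callable mapping the step count to a learning rate. When it is callable, negation has to be deferred by wrapping the schedule instead of negating a value eagerly. A standalone sketch of that pattern, with illustrative names rather than the torchopt internals:

```python
from typing import Callable, Union

ScalarOrSchedule = Union[float, Callable[[int], float]]


def negate_lr(lr: ScalarOrSchedule) -> ScalarOrSchedule:
    """Return the negated learning rate, preserving schedule-ness.

    Gradient descent scales updates by -lr, so a schedule must be wrapped
    and evaluated lazily rather than negated once up front.
    """
    if callable(lr):

        def schedule_wrapper(count: int) -> float:
            return -lr(count)  # evaluate the schedule at this step, then flip the sign

        return schedule_wrapper
    return -lr


# Usage: a linear warm-up schedule, negated for descent-style updates.
def warmup(step: int) -> float:
    return 1e-3 * min(1.0, step / 100)


negated = negate_lr(warmup)
print(negated(50))  # -> -0.0005
```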
torchopt/base.py (2 additions, 7 deletions)
@@ -34,12 +34,7 @@
import itertools
from abc import abstractmethod
from typing import TYPE_CHECKING, Callable, NamedTuple, Optional, Tuple


try:
from typing import Protocol # pylint: disable=unused-import
except ImportError:
from typing_extensions import Protocol # type: ignore[assignment]
from typing_extensions import Protocol # Python 3.8+


if TYPE_CHECKING:
@@ -229,7 +224,7 @@ def __new__(cls):
@staticmethod
def init_fn(params: 'Params') -> 'OptState': # pylint: disable=unused-argument
"""Returns empty state."""
return EmptyState()
return EmptyState() # type: ignore[return-value]

@staticmethod
def update_fn(
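`Protocol` is now imported unconditionally from `typing_extensions`, which provides it on Python 3.7 and re-exports `typing.Protocol` on 3.8+, so the try/except fallback and its pragmas can go. As a reminder of what `Protocol` is used for, a small structural-typing example; it is purely illustrative, not the actual torchopt interfaces:

```python
from typing_extensions import Protocol  # typing.Protocol on 3.8+, backported below that


class UpdateFn(Protocol):
    """Structural type: anything callable as update_fn(updates, state) -> (updates, state)."""

    def __call__(self, updates: dict, state: dict) -> tuple:
        ...


def apply(fn: UpdateFn, updates: dict, state: dict) -> tuple:
    # A static checker accepts any callable matching the protocol's signature,
    # without requiring it to inherit from UpdateFn.
    return fn(updates, state)


def scale_by_neg_lr(updates: dict, state: dict) -> tuple:
    return {name: -0.01 * g for name, g in updates.items()}, state


print(apply(scale_by_neg_lr, {'w': 1.0}, {}))  # ({'w': -0.01}, {})
```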
torchopt/distributed/api.py (11 additions, 16 deletions)
@@ -35,7 +35,7 @@

import torchopt.pytree as pytree
from torchopt.distributed.world import get_worker_id, get_world_rank, get_world_size
from torchopt.typing import Future, PyTree
from torchopt.typing import Future


__all__ = [
@@ -116,11 +116,12 @@ def __call__(
workers = list(map(get_worker_id, self.workers))
num_workers = len(workers)

args_tree = cast(PyTree[Any], (args, kwargs))
flattened_args, treedef = pytree.tree_flatten(args_tree)
args_tree = (args, kwargs)
flat_args: List[Any]
flat_args, treedef = pytree.tree_flatten(args_tree) # type: ignore[arg-type]

batch_size = None
for arg in flattened_args:
for arg in flat_args:
if isinstance(arg, torch.Tensor):
if batch_size is None:
batch_size = arg.shape[self.dim]
@@ -134,7 +135,6 @@ def __call__(
return [(get_world_rank(), args, kwargs.copy())]

dim_slices: List[Union[int, slice]]
# pylint: disable-next=line-too-long
batch_slices: List[Tuple[Union[int, slice, Ellipsis.__class__], ...]] # type: ignore[name-defined]
if self.exclusive:
num_replicas = batch_size
@@ -169,18 +169,18 @@
for dim_slice in dim_slices
]

flattened_args_replicas: List[List[Any]] = [[] for _ in range(num_replicas)]
for arg in flattened_args:
flat_args_replicas: List[List[Any]] = [[] for _ in range(num_replicas)]
for arg in flat_args:
if isinstance(arg, torch.Tensor):
for i, batch_slice in enumerate(batch_slices):
flattened_args_replicas[i].append(arg[batch_slice])
flat_args_replicas[i].append(arg[batch_slice])
else:
for i in range(num_replicas):
flattened_args_replicas[i].append(arg)
flat_args_replicas[i].append(arg)

args_replicas: List[Tuple[Args, KwArgs]] = [
pytree.tree_unflatten(treedef, args_replica) # type: ignore[misc]
for args_replica in flattened_args_replicas
for args_replica in flat_args_replicas
]

return [
@@ -237,8 +237,6 @@ def dim_partitioner(
return TensorDimensionPartitioner(dim, exclusive=exclusive, keepdim=keepdim, workers=workers)


# fmt: off
# pylint: disable=line-too-long
batch_partitioner: PartitionFunction = dim_partitioner(dim=0, keepdim=True, exclusive=False)
"""Partitioner for batch dimension. Divide and replicates the arguments to all workers along the first dimension.

@@ -249,16 +247,14 @@ def dim_partitioner(
All tensors in the ``args`` and ``kwargs`` will be partitioned along the dimension ``dim``,
while the non-tensor values will be broadcasted to partitions.
"""
exclusive_batch_partitioner: PartitionFunction = dim_partitioner(dim=0, keepdim=True, exclusive=True)
exclusive_batch_partitioner: PartitionFunction = dim_partitioner(dim=0, keepdim=True, exclusive=True) # fmt: skip
"""Partitioner for batch dimension. Divide and replicates the arguments to all workers along the first dimension.

Each batch sample will be assigned to a separate RPC call.

All tensors in the ``args`` and ``kwargs`` will be partitioned along the dimension ``dim``,
while the non-tensor values will be broadcasted to partitions.
"""
# pylint: enable=line-too-long
# fmt: on


def mean_reducer(results: Iterable[torch.Tensor]) -> torch.Tensor:
@@ -280,7 +276,6 @@ def remote_async_call(
reducer: Optional[Callable[[Iterable[T]], U]] = None,
timeout: Optional[float] = UNSET_RPC_TIMEOUT,
) -> Union[Future[List[T]], Future[U]]:
# pylint: disable=line-too-long
"""Asynchronously do an RPC on remote workers and return the a :class:`torch.Future` instance at the current worker.

Args:
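The partitioner changes above flatten `(args, kwargs)` into a pytree, slice every tensor leaf along `self.dim` into one chunk per worker (or one chunk per sample when `exclusive=True`), replicate the non-tensor leaves, and unflatten one argument set per replica for the RPC calls. A simplified sketch of just that slicing logic, without the pytree and RPC machinery (names are illustrative):

```python
from typing import Any, List

import torch


def partition_batch(args: List[Any], num_workers: int, dim: int = 0) -> List[List[Any]]:
    """Split every tensor argument into num_workers contiguous chunks along dim;
    non-tensor arguments are replicated to every partition (keepdim=True, exclusive=False)."""
    batch_size = next(a for a in args if isinstance(a, torch.Tensor)).shape[dim]
    # Distribute samples as evenly as possible: the first `remainder` workers get one extra.
    base, remainder = divmod(batch_size, num_workers)
    sizes = [base + (1 if i < remainder else 0) for i in range(num_workers)]

    replicas: List[List[Any]] = []
    offset = 0
    for size in sizes:
        replica = [
            arg.narrow(dim, offset, size) if isinstance(arg, torch.Tensor) else arg
            for arg in args
        ]
        replicas.append(replica)
        offset += size
    return replicas


# Usage: a batch of 10 samples split across 4 workers -> chunk sizes [3, 3, 2, 2];
# the non-tensor argument is broadcast to every replica.
x = torch.randn(10, 5)
parts = partition_batch([x, 'sum-reduction'], num_workers=4)
print([replica[0].shape[0] for replica in parts])  # [3, 3, 2, 2]
```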