Skip to content

Instantly share code, notes, and snippets.

5Cw9kWG4YVapVuXekuGUH1mzGFZg4jjw7Q1UcLaGwc57xm3e
5Hot6fAxKzarjuFu6jvSiCCcNP9tp61gc4JS5cdiSRWdqeaW
5C7NvbmpfR3956shdAdV1ASbsbezANiA7sB4H5PBtUyMjUiz
5FjP8fFbMb6pEHfRZyRegsmwRUMDuLFNcaBu1TerWMPEKgNh
5Evsh6VqUEE53FMBAg6LCeXPA9RJw7PYdKfFKEfaYezT2Uv1
5GmsXK1D5uVFgmpQdQYveDQMu7fdq4Dp1N8rvakkEPJSqbDB
5GKHLgHnp1wdXTB1krScJMhrjqwn2XGv239XfMqSx5c2xXU8
5FFBe3jLgTGsoZy9CSXQ7HFntMcgQMeC1cckX4oMCXcbn3JR
5GHNXTKu5ERKvGi3VB4DUuLTqfZuSA8gQ11W3hm59eRZsoNn
5EbiJVEou3PFSYU7r8x8njcG38MNav6dC6TQZiZeKCoNxYUr
@zvnt
zvnt / miner_diloco.py
Created December 26, 2025 02:14
Distributed training strategy submission
import math
import torch
import torch.nn.utils as nn_utils
import torch.distributed as dist
from copy import deepcopy
from dataclasses import dataclass
from torch.optim.lr_scheduler import LambdaLR
from typing import List, Type, Union, Optional, Dict, Any
from abc import ABC, abstractmethod