Skip to content

Instantly share code, notes, and snippets.

@Glimmerwave
Glimmerwave / miner_diloco.py
Created January 7, 2026 15:11
Distributed training strategy submission
import math
import torch
import torch.nn.utils as nn_utils
import torch.distributed as dist
from copy import deepcopy
from dataclasses import dataclass
from torch.optim.lr_scheduler import LambdaLR
from typing import List, Type, Union, Optional, Dict, Any
from abc import ABC, abstractmethod
@Glimmerwave
Glimmerwave / miner_diloco.py
Created January 7, 2026 08:40
Distributed training strategy submission
import math
import torch
import torch.nn.utils as nn_utils
import torch.distributed as dist
from copy import deepcopy
from dataclasses import dataclass
from torch.optim.lr_scheduler import LambdaLR
from typing import List, Type, Union, Optional, Dict, Any
from abc import ABC, abstractmethod