trainer-kit/config.py at main · matheothedev/trainer-kit · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
"""
Configuration management for Decloud Trainer
"""
import os
import json
from pathlib import Path
from typing import Optional, List, Dict, Any

# Paths
HOME_DIR = Path.home()
CONFIG_DIR = HOME_DIR / ".decloud-trainer"
CONFIG_FILE = CONFIG_DIR / "config.json"
CACHE_DIR = CONFIG_DIR / "cache"
MODELS_CACHE = CACHE_DIR / "models"
GRADIENTS_DIR = CONFIG_DIR / "gradients"

# Solana
PROGRAM_ID = "DCLDgP6xHuVmcKuGvAzKEkrbSYHApp9568JhVoXsF2Hh"
TREASURY = "FzuCxi65QyFXAGbHcXB28RXqyBZSZ5KXLQxeofx1P9K2"

# RPC Endpoints
RPC_ENDPOINTS = {
    "devnet": "https://api.devnet.solana.com",
    "mainnet": "https://api.mainnet-beta.solana.com",
    "testnet": "https://api.testnet.solana.com",
}

# WebSocket endpoints
WS_ENDPOINTS = {
    "devnet": "wss://api.devnet.solana.com",
    "mainnet": "wss://api.mainnet-beta.solana.com",
    "testnet": "wss://api.testnet.solana.com",
}

# IPFS Gateways for reading (Lighthouse primary)
IPFS_GATEWAYS = [
    "https://gateway.lighthouse.storage/ipfs/",
    "https://ipfs.io/ipfs/",
    "https://cloudflare-ipfs.com/ipfs/",
    "https://dweb.link/ipfs/",
]

# Dataset enum mapping (must match contract)
DATASETS = {
    "Cifar10": 0, "Cifar100": 1, "Mnist": 2, "FashionMnist": 3, "Emnist": 4,
    "Kmnist": 5, "Food101": 6, "Flowers102": 7, "StanfordDogs": 8, "StanfordCars": 9,
    "OxfordPets": 10, "CatsVsDogs": 11, "Eurosat": 12, "Svhn": 13, "Caltech101": 14,
    "Caltech256": 15, "Imdb": 16, "Sst2": 17, "Sst5": 18, "YelpReviews": 19,
    "AmazonPolarity": 20, "RottenTomatoes": 21, "FinancialSentiment": 22, "TweetSentiment": 23,
    "AgNews": 24, "Dbpedia": 25, "YahooAnswers": 26, "TwentyNewsgroups": 27,
    "SmsSpam": 28, "HateSpeech": 29, "CivilComments": 30, "Toxicity": 31,
    "ClincIntent": 32, "Banking77": 33, "SnipsIntent": 34, "Conll2003": 35,
    "Wnut17": 36, "Squad": 37, "SquadV2": 38, "TriviaQa": 39, "BoolQ": 40,
    "CommonsenseQa": 41, "Stsb": 42, "Mrpc": 43, "Qqp": 44, "Snli": 45,
    "Mnli": 46, "CnnDailymail": 47, "Xsum": 48, "Samsum": 49, "SpeechCommands": 50,
    "Librispeech": 51, "CommonVoice": 52, "Gtzan": 53, "Esc50": 54, "Urbansound8k": 55,
    "Nsynth": 56, "Ravdess": 57, "CremaD": 58, "Iemocap": 59, "Iris": 60,
    "Wine": 61, "Diabetes": 62, "BreastCancer": 63, "CaliforniaHousing": 64,
    "AdultIncome": 65, "BankMarketing": 66, "CreditDefault": 67, "Titanic": 68,
    "HeartDisease": 69, "ChestXray": 70, "SkinCancer": 71, "DiabeticRetinopathy": 72,
    "BrainTumor": 73, "Malaria": 74, "BloodCells": 75, "CovidXray": 76,
    "PubmedQa": 77, "MedQa": 78, "Electricity": 79, "Weather": 80, "StockPrices": 81,
    "EcgHeartbeat": 82, "CodeSearchNet": 83, "Humaneval": 84, "Mbpp": 85,
    "Spider": 86, "Cora": 87, "Citeseer": 88, "Qm9": 89, "NslKdd": 90,
    "CreditCardFraud": 91, "Phishing": 92, "Movielens1m": 93, "Movielens100k": 94,
    "Xnli": 95, "AmazonReviewsMulti": 96, "Sberquad": 97,
    # Reasoning & Logic
    "Gsm8k": 98, "Arc": 99, "HellaSwag": 100, "WinoGrande": 101, "Piqa": 102,
    # Knowledge & Factuality
    "TruthfulQa": 103, "Mmlu": 104, "NaturalQuestions": 105, "OpenBookQa": 106,
    # Code Generation
    "CodeXGlue": 107, "Ds1000": 108,
    # Translation
    "Wmt14": 109, "Opus100": 110, "Flores": 111,
    # Safety & Toxicity
    "ToxiGen": 112, "RealToxicityPrompts": 113, "HateSpeech18": 114,
    # Dialog
    "MultiWoz": 115, "PersonaChat": 116, "DailyDialog": 117,
    # Instruction Following
    "AlpacaEval": 118, "Flan": 119, "SuperNaturalInstructions": 120,
    # Multilingual
    "PawsX": 121, "TydiQa": 122, "Xcopa": 123,
    # Long Context
    "Scrolls": 124, "Quality": 125, "NarrativeQa": 126,
}

DATASET_ID_TO_NAME = {v: k for k, v in DATASETS.items()}


class Config:
    """Trainer configuration"""

    def __init__(self):
        # Wallet
        self.private_key: Optional[str] = None
        self.network: str = "mainnet"
        self.custom_rpc: Optional[str] = None  # Custom RPC URL (overrides network default)

        # Lighthouse Storage (IPFS)
        self.lighthouse_api_key: Optional[str] = None

        # Training settings
        self.min_reward: float = 0.01  # Minimum reward in SOL to participate
        self.max_concurrent_training: int = 1
        self.training_epochs: int = 5
        self.training_batch_size: int = 32
        self.learning_rate: float = 0.001

        # Dataset paths mapping: dataset_name -> local_path
        self.dataset_paths: Dict[str, str] = {}

        # LLM support
        self.allow_llm: bool = True

        # Privacy: noise added to weights before submission
        self.noise_scale: float = 0.001  # 0.1% noise - small but protective
        self.noise_enabled: bool = True

        # Auto mode
        self.auto_train: bool = True
        self.poll_interval: int = 30

        self._ensure_dirs()
        self._load()

    def _ensure_dirs(self):
        """Create necessary directories"""
        CONFIG_DIR.mkdir(parents=True, exist_ok=True)
        CACHE_DIR.mkdir(parents=True, exist_ok=True)
        MODELS_CACHE.mkdir(parents=True, exist_ok=True)
        GRADIENTS_DIR.mkdir(parents=True, exist_ok=True)

    def _load(self):
        """Load config from file"""
        if CONFIG_FILE.exists():
            with open(CONFIG_FILE, "r") as f:
                data = json.load(f)
                self.private_key = data.get("private_key")
                self.network = data.get("network", "devnet")
                self.custom_rpc = data.get("custom_rpc")
                self.lighthouse_api_key = data.get("lighthouse_api_key")
                self.min_reward = data.get("min_reward", 0.01)
                self.max_concurrent_training = data.get("max_concurrent_training", 1)
                self.training_epochs = data.get("training_epochs", 5)
                self.training_batch_size = data.get("training_batch_size", 32)
                self.learning_rate = data.get("learning_rate", 0.001)
                self.dataset_paths = data.get("dataset_paths", {})
                self.allow_llm = data.get("allow_llm", True)
                self.auto_train = data.get("auto_train", True)
                self.noise_scale = data.get("noise_scale", 0.001)
                self.noise_enabled = data.get("noise_enabled", True)

    def save(self):
        """Save config to file"""
        data = {
            "private_key": self.private_key,
            "network": self.network,
            "custom_rpc": self.custom_rpc,
            "lighthouse_api_key": self.lighthouse_api_key,
            "min_reward": self.min_reward,
            "max_concurrent_training": self.max_concurrent_training,
            "training_epochs": self.training_epochs,
            "training_batch_size": self.training_batch_size,
            "learning_rate": self.learning_rate,
            "dataset_paths": self.dataset_paths,
            "allow_llm": self.allow_llm,
            "auto_train": self.auto_train,
            "noise_scale": self.noise_scale,
            "noise_enabled": self.noise_enabled,
        }
        with open(CONFIG_FILE, "w") as f:
            json.dump(data, f, indent=2)

    @property
    def rpc_url(self) -> str:
        if self.custom_rpc:
            return self.custom_rpc
        return RPC_ENDPOINTS.get(self.network, RPC_ENDPOINTS["devnet"])

    @property
    def ws_url(self) -> str:
        return WS_ENDPOINTS.get(self.network, WS_ENDPOINTS["devnet"])

    def has_lighthouse(self) -> bool:
        """Check if Lighthouse is configured"""
        return bool(self.lighthouse_api_key)

    def get_dataset_path(self, dataset_name: str) -> Optional[str]:
        """Get local path for dataset"""
        return self.dataset_paths.get(dataset_name)

    def set_dataset_path(self, dataset_name: str, path: str):
        """Set local path for dataset"""
        self.dataset_paths[dataset_name] = path
        self.save()

    def remove_dataset_path(self, dataset_name: str):
        """Remove dataset path mapping"""
        if dataset_name in self.dataset_paths:
            del self.dataset_paths[dataset_name]
            self.save()

    def can_train(self, dataset_name: str) -> bool:
        """Check if we can train on this dataset"""
        return dataset_name in self.dataset_paths


# Global config instance
config = Config()