# pyproject.toml
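# Flower app configuration for flowertune-med: federated fine-tuning of
# Mistral-7B-Instruct-v0.3 on the medalpaca medical flashcards dataset.
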
[build-system]
requires = ["hatchling"]
build-backend = "hatchling.build"
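
# Standard PEP 621 project metadata. The training-stack dependencies are pinned
# to exact versions so every federated client runs the same stack.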
[project]
name = "flowertune-med"
version = "1.0.0"
description = ""
license = "Apache-2.0"
dependencies = [
    "flwr[simulation]>=1.12.0",
    "flwr-datasets>=0.3.0",
    "trl==0.8.1",
    "bitsandbytes==0.43.0",
    "scipy==1.13.0",
    "peft==0.6.2",
    "transformers==4.43.1",
    "sentencepiece==0.2.0",
    "omegaconf==2.3.0",
    "hf_transfer==0.1.8",
]
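
# Package the repository root so the flowertune_med modules referenced below
# ship in the built wheel.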
[tool.hatch.build.targets.wheel]
packages = ["."]
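
# Flower app metadata; `publisher` identifies who published the app.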
[tool.flwr.app]
publisher = "mrs83"
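
# Entry points resolved by `flwr run`, given as "<module>:<attribute>" paths to
# the ServerApp and ClientApp objects.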
[tool.flwr.app.components]
serverapp = "flowertune_med.server_app:app"
clientapp = "flowertune_med.client_app:app"
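
# Run config. Flower exposes every value below to both apps through
# `context.run_config`, flattened to dotted keys (e.g. run_config["model.name"]).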
[tool.flwr.app.config]
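# Model settings: load the base model 4-bit quantized (via bitsandbytes) and
# attach LoRA adapters (rank 8, alpha 32) through PEFT, presumably so that only
# the small adapter weights travel between server and clients.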
model.name = "mistralai/Mistral-7B-Instruct-v0.3"
model.quantization = 4
model.gradient-checkpointing = true
model.lora.peft-lora-r = 8
model.lora.peft-lora-alpha = 32
train.save-every-round = 5
train.learning-rate-max = 5e-5
train.learning-rate-min = 1e-6
train.seq-length = 512
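# output-dir and learning-rate are intentionally empty; presumably the client
# app fills them in each round, deriving the per-round rate from
# learning-rate-max and learning-rate-min above.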
train.training-arguments.output-dir = ""
train.training-arguments.learning-rate = ""
train.training-arguments.per-device-train-batch-size = 16
train.training-arguments.gradient-accumulation-steps = 1
train.training-arguments.logging-steps = 1
train.training-arguments.num-train-epochs = 3
train.training-arguments.max-steps = 6
train.training-arguments.warmup-steps = 2
train.training-arguments.save-steps = 1000
train.training-arguments.save-total-limit = 10
train.training-arguments.max-grad-norm = 1.0
train.training-arguments.gradient-checkpointing = true
train.training-arguments.lr-scheduler-type = "constant_with_warmup"
train.training-arguments.fp16 = false
train.training-arguments.bf16 = true
train.training-arguments.tf32 = true
train.training-arguments.optim = "paged_adamw_8bit"
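# Sample 15% of clients per round (0.15 of 20 SuperNodes, i.e. 3 clients);
# federated evaluation is disabled.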
strategy.fraction-fit = 0.15
strategy.fraction-evaluate = 0.0
num-server-rounds = 100
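
# Static config: values that stay fixed for the app (here, the training dataset).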
[tool.flwr.app.config.static]
dataset.name = "medalpaca/medical_meadow_medical_flashcards"
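
# Federations available to `flwr run`; "local-simulation" is used when no
# federation is named on the command line.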
[tool.flwr.federations]
default = "local-simulation"
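
# Local simulation: 20 simulated SuperNodes, with each ClientApp allocated
# 6 CPUs and a full GPU by the (Ray-based) simulation backend.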
[tool.flwr.federations.local-simulation]
options.num-supernodes = 20
options.backend.client-resources.num-cpus = 6
options.backend.client-resources.num-gpus = 1.0
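
# Launch locally with `flwr run .` to use the default federation above.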