Skip to content
Snippets Groups Projects
Commit fcc154c6 authored by Tim Tobias Bauerle
Browse files

experiment setups

parent b43bdda4
Branches
No related tags found
1 merge request: !22 "Fix lr schedule"
deduction_per_second: 0.02
deduction_per_mflop: 0.00000005
deduction_per_mbyte_received: 0.0002
deduction_per_mbyte_sent: 0.0002
devices: [
{
device_id: "d0",
address: "localhost:50051",
battery_capacity: 1000000,
torch_device: cuda:0
},
{
device_id: "d1",
address: "localhost:50052",
battery_capacity: 1000000,
torch_device: cuda:1
},
{
device_id: "d2",
address: "localhost:50053",
battery_capacity: 1000000,
torch_device: cuda:2
},
{
device_id: "d3",
address: "localhost:50054",
battery_capacity: 1000000,
torch_device: cuda:0
},
{
device_id: "d4",
address: "localhost:50055",
battery_capacity: 1000000,
torch_device: cuda:1
},
{
device_id: "d5",
address: "localhost:50056",
battery_capacity: 1000000,
torch_device: cuda:2
},
{
device_id: "d6",
address: "localhost:50057",
battery_capacity: 1000000,
torch_device: cuda:0
},
{
device_id: "d7",
address: "localhost:50058",
battery_capacity: 1000000,
torch_device: cuda:1
},
{
device_id: "d8",
address: "localhost:50059",
battery_capacity: 1000000,
torch_device: cuda:2
},
{
device_id: "d9",
address: "localhost:50060",
battery_capacity: 1000000,
torch_device: cuda:0
}
]
devices: [
{
device_id: "d0",
address: "localhost:50051",
battery_capacity: 400,
},
{
device_id: "d1",
address: "localhost:50052",
battery_capacity: 400
},
{
device_id: "d2",
address: "localhost:50053",
battery_capacity: 300
},
{
device_id: "d3",
address: "localhost:50054",
battery_capacity: 200
},
{
device_id: "d4",
address: "localhost:50055",
battery_capacity: 200
}
]
...@@ -298,7 +298,9 @@ class DeviceServer: ...@@ -298,7 +298,9 @@ class DeviceServer:
print( print(
f"\n{Fore.RED}ADAPTIVE TRESHOLD REACHED, NEXT BATCH\n{Fore.RESET}" f"\n{Fore.RED}ADAPTIVE TRESHOLD REACHED, NEXT BATCH\n{Fore.RESET}"
) )
self.node_device.log({"adaptive_learning_threshold_applied": True}) self.node_device.log(
{"adaptive_learning_threshold_applied": server_gradients.size(0)}
)
continue continue
num_client_gradients = len(client_forward_pass_responses) num_client_gradients = len(client_forward_pass_responses)
......
0% Loading or .
You are about to add 0 people to the discussion. Proceed with caution.
Please register or sign in to comment