2021-02-01 14:31:20 +09:00
|
|
|
/*
|
|
|
|
|
* ******************************************************************************
|
|
|
|
|
* *
|
|
|
|
|
* *
|
|
|
|
|
* * This program and the accompanying materials are made available under the
|
|
|
|
|
* * terms of the Apache License, Version 2.0 which is available at
|
|
|
|
|
* * https://www.apache.org/licenses/LICENSE-2.0.
|
|
|
|
|
* *
|
2021-02-01 17:47:29 +09:00
|
|
|
* * See the NOTICE file distributed with this work for additional
|
|
|
|
|
* * information regarding copyright ownership.
|
2021-02-01 14:31:20 +09:00
|
|
|
* * Unless required by applicable law or agreed to in writing, software
|
|
|
|
|
* * distributed under the License is distributed on an "AS IS" BASIS, WITHOUT
|
|
|
|
|
* * WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the
|
|
|
|
|
* * License for the specific language governing permissions and limitations
|
|
|
|
|
* * under the License.
|
|
|
|
|
* *
|
|
|
|
|
* * SPDX-License-Identifier: Apache-2.0
|
|
|
|
|
* *****************************************************************************
|
|
|
|
|
*/
|
2019-06-06 15:21:15 +03:00
|
|
|
|
|
|
|
|
package org.deeplearning4j.optimize.listeners;
|
|
|
|
|
|
2023-05-08 09:34:44 +02:00
|
|
|
import java.io.Serializable;
|
|
|
|
|
import java.util.List;
|
|
|
|
|
import java.util.Map;
|
|
|
|
|
import java.util.concurrent.atomic.AtomicLong;
|
2019-06-06 15:21:15 +03:00
|
|
|
import lombok.*;
|
|
|
|
|
import lombok.extern.slf4j.Slf4j;
|
2023-03-23 17:39:00 +01:00
|
|
|
import net.brutex.ai.dnn.api.IModel;
|
2019-06-06 15:21:15 +03:00
|
|
|
import org.deeplearning4j.optimize.api.BaseTrainingListener;
|
2020-05-04 15:54:03 +10:00
|
|
|
import org.nd4j.common.util.ThreadUtils;
|
2019-06-06 15:21:15 +03:00
|
|
|
import org.nd4j.linalg.api.ndarray.INDArray;
|
|
|
|
|
|
|
|
|
|
@AllArgsConstructor
|
|
|
|
|
@NoArgsConstructor
|
|
|
|
|
@Data
|
|
|
|
|
@Builder
|
|
|
|
|
@Slf4j
|
|
|
|
|
public class SleepyTrainingListener extends BaseTrainingListener implements Serializable {
|
|
|
|
|
public enum SleepMode {
|
|
|
|
|
/**
|
|
|
|
|
* In this mode parkNanos() call will be used, to make process really idle
|
|
|
|
|
*/
|
|
|
|
|
PARK,
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* In this mode Thread.sleep() call will be used, to make sleep traceable via profiler
|
|
|
|
|
*/
|
|
|
|
|
SLEEP,
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* Busy-lock will be used, to guarantee 100% thread use
|
|
|
|
|
*/
|
|
|
|
|
BUSY,
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
public enum TimeMode {
|
|
|
|
|
/**
|
|
|
|
|
* In this mode, listener will be trying to match specified time for a given invocation method.
|
|
|
|
|
* I.e. if iteration sleep is set to 500, and real iteration was 35 ms, thread will be sleeping for 465ms, to match target time of 500ms
|
|
|
|
|
*
|
|
|
|
|
*/
|
|
|
|
|
ADDITIVE,
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* In this mode, listener will just call
|
|
|
|
|
*/
|
|
|
|
|
SIMPLE
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
@Getter(AccessLevel.NONE)
|
|
|
|
|
@Setter(AccessLevel.NONE)
|
|
|
|
|
protected final transient ThreadLocal<AtomicLong> lastEE = new ThreadLocal<>();
|
|
|
|
|
|
|
|
|
|
@Getter(AccessLevel.NONE)
|
|
|
|
|
@Setter(AccessLevel.NONE)
|
|
|
|
|
protected final transient ThreadLocal<AtomicLong> lastES = new ThreadLocal<>();
|
|
|
|
|
|
|
|
|
|
@Getter(AccessLevel.NONE)
|
|
|
|
|
@Setter(AccessLevel.NONE)
|
|
|
|
|
protected final transient ThreadLocal<AtomicLong> lastFF = new ThreadLocal<>();
|
|
|
|
|
|
|
|
|
|
@Getter(AccessLevel.NONE)
|
|
|
|
|
@Setter(AccessLevel.NONE)
|
|
|
|
|
protected final transient ThreadLocal<AtomicLong> lastBP = new ThreadLocal<>();
|
|
|
|
|
|
|
|
|
|
@Getter(AccessLevel.NONE)
|
|
|
|
|
@Setter(AccessLevel.NONE)
|
|
|
|
|
protected final transient ThreadLocal<AtomicLong> lastIteration = new ThreadLocal<>();
|
|
|
|
|
|
|
|
|
|
@Builder.Default
|
|
|
|
|
protected long timerEE = 0L;
|
|
|
|
|
@Builder.Default
|
|
|
|
|
protected long timerES = 0L;
|
|
|
|
|
@Builder.Default
|
|
|
|
|
protected long timerFF = 0L;
|
|
|
|
|
@Builder.Default
|
|
|
|
|
protected long timerBP = 0L;
|
|
|
|
|
@Builder.Default
|
|
|
|
|
protected long timerIteration = 0L;
|
|
|
|
|
|
|
|
|
|
@Builder.Default
|
|
|
|
|
protected SleepMode sleepMode = SleepMode.PARK;
|
|
|
|
|
|
|
|
|
|
@Builder.Default
|
|
|
|
|
protected TimeMode timeMode = TimeMode.SIMPLE;
|
|
|
|
|
|
|
|
|
|
protected void sleep(long sleepTimeMs) {
|
|
|
|
|
if (sleepTimeMs < 1)
|
|
|
|
|
return;
|
|
|
|
|
|
|
|
|
|
switch (sleepMode) {
|
|
|
|
|
case PARK:
|
|
|
|
|
ThreadUtils.uncheckedSleep(sleepTimeMs);
|
|
|
|
|
break;
|
|
|
|
|
case BUSY: {
|
|
|
|
|
long target = System.currentTimeMillis() + sleepTimeMs;
|
|
|
|
|
while (System.currentTimeMillis() < target) {
|
|
|
|
|
Thread.yield();
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
break;
|
|
|
|
|
case SLEEP:
|
|
|
|
|
try {
|
|
|
|
|
Thread.sleep(sleepTimeMs);
|
|
|
|
|
} catch (InterruptedException e) {
|
|
|
|
|
Thread.currentThread().interrupt();
|
|
|
|
|
throw new RuntimeException(e);
|
|
|
|
|
}
|
|
|
|
|
break;
|
|
|
|
|
default:
|
|
|
|
|
throw new IllegalStateException("Unknown SleepMode value passed in: " + sleepMode);
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
protected void sleep(AtomicLong lastTime, long sleepTime) {
|
|
|
|
|
if (sleepTime == 0)
|
|
|
|
|
return;
|
|
|
|
|
|
|
|
|
|
// if that's SIMPLE mode - just sleep specific time, and go
|
|
|
|
|
if (timeMode == TimeMode.SIMPLE) {
|
|
|
|
|
sleep(sleepTime);
|
|
|
|
|
return;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
// we're skipping first iteration here, just sleeping fixed amount of time
|
|
|
|
|
if (lastTime == null) {
|
|
|
|
|
sleep(sleepTime);
|
|
|
|
|
return;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
// getting delta between real cycle time and desired one.
|
|
|
|
|
long currentTime = System.currentTimeMillis();
|
|
|
|
|
long delta = sleepTime - (currentTime - lastTime.get());
|
|
|
|
|
|
|
|
|
|
sleep(delta);
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
@Override
|
2023-03-23 17:39:00 +01:00
|
|
|
public void onEpochStart(IModel model) {
|
2019-06-06 15:21:15 +03:00
|
|
|
sleep(lastES.get(), timerES);
|
|
|
|
|
|
|
|
|
|
if (lastES.get() == null)
|
|
|
|
|
lastES.set(new AtomicLong(System.currentTimeMillis()));
|
|
|
|
|
else
|
|
|
|
|
lastES.get().set(System.currentTimeMillis());
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
@Override
|
2023-03-23 17:39:00 +01:00
|
|
|
public void onEpochEnd(IModel model) {
|
2019-06-06 15:21:15 +03:00
|
|
|
sleep(lastEE.get(), timerEE);
|
|
|
|
|
|
|
|
|
|
if (lastEE.get() == null)
|
|
|
|
|
lastEE.set(new AtomicLong(System.currentTimeMillis()));
|
|
|
|
|
else
|
|
|
|
|
lastEE.get().set(System.currentTimeMillis());
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
@Override
|
2023-03-23 17:39:00 +01:00
|
|
|
public void onForwardPass(IModel model, List<INDArray> activations) {
|
2019-06-06 15:21:15 +03:00
|
|
|
sleep(lastFF.get(), timerFF);
|
|
|
|
|
|
|
|
|
|
if (lastFF.get() == null)
|
|
|
|
|
lastFF.set(new AtomicLong(System.currentTimeMillis()));
|
|
|
|
|
else
|
|
|
|
|
lastFF.get().set(System.currentTimeMillis());
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
@Override
|
2023-03-23 17:39:00 +01:00
|
|
|
public void onForwardPass(IModel model, Map<String, INDArray> activations) {
|
2019-06-06 15:21:15 +03:00
|
|
|
sleep(lastFF.get(), timerFF);
|
|
|
|
|
|
|
|
|
|
if (lastFF.get() == null)
|
|
|
|
|
lastFF.set(new AtomicLong(System.currentTimeMillis()));
|
|
|
|
|
else
|
|
|
|
|
lastFF.get().set(System.currentTimeMillis());
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
@Override
|
2023-03-23 17:39:00 +01:00
|
|
|
public void iterationDone(IModel model, int iteration, int epoch) {
|
2019-06-06 15:21:15 +03:00
|
|
|
sleep(lastIteration.get(), timerIteration);
|
|
|
|
|
|
|
|
|
|
if (lastIteration.get() == null)
|
|
|
|
|
lastIteration.set(new AtomicLong(System.currentTimeMillis()));
|
|
|
|
|
else
|
|
|
|
|
lastIteration.get().set(System.currentTimeMillis());
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
@Override
|
2023-03-23 17:39:00 +01:00
|
|
|
public void onBackwardPass(IModel model) {
|
2019-06-06 15:21:15 +03:00
|
|
|
sleep(lastBP.get(), timerBP);
|
|
|
|
|
|
|
|
|
|
if (lastBP.get() == null)
|
|
|
|
|
lastBP.set(new AtomicLong(System.currentTimeMillis()));
|
|
|
|
|
else
|
|
|
|
|
lastBP.get().set(System.currentTimeMillis());
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
@Override
|
2023-03-23 17:39:00 +01:00
|
|
|
public void onGradientCalculation(IModel model) {
|
2019-06-06 15:21:15 +03:00
|
|
|
//
|
|
|
|
|
}
|
|
|
|
|
}
|