139 lines
4.3 KiB
Java
139 lines
4.3 KiB
Java
/*******************************************************************************
|
|
* Copyright (c) 2015-2018 Skymind, Inc.
|
|
*
|
|
* This program and the accompanying materials are made available under the
|
|
* terms of the Apache License, Version 2.0 which is available at
|
|
* https://www.apache.org/licenses/LICENSE-2.0.
|
|
*
|
|
* Unless required by applicable law or agreed to in writing, software
|
|
* distributed under the License is distributed on an "AS IS" BASIS, WITHOUT
|
|
* WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the
|
|
* License for the specific language governing permissions and limitations
|
|
* under the License.
|
|
*
|
|
* SPDX-License-Identifier: Apache-2.0
|
|
******************************************************************************/
|
|
|
|
package org.deeplearning4j.arbiter.layers;
|
|
|
|
import lombok.AccessLevel;
|
|
import lombok.Data;
|
|
import lombok.EqualsAndHashCode;
|
|
import lombok.NoArgsConstructor;
|
|
import org.deeplearning4j.arbiter.dropout.DropoutSpace;
|
|
import org.deeplearning4j.arbiter.optimize.api.AbstractParameterSpace;
|
|
import org.deeplearning4j.arbiter.optimize.api.ParameterSpace;
|
|
import org.deeplearning4j.arbiter.optimize.parameter.FixedValue;
|
|
import org.deeplearning4j.nn.conf.dropout.IDropout;
|
|
import org.deeplearning4j.nn.conf.layers.Layer;
|
|
import org.nd4j.shade.jackson.annotation.JsonInclude;
|
|
|
|
import java.util.ArrayList;
|
|
import java.util.LinkedList;
|
|
import java.util.List;
|
|
import java.util.Map;
|
|
|
|
/**
|
|
* LayerSpace contains common Layer hyperparameters; should match {@link Layer} in terms of features
|
|
*
|
|
* @author Alex Black
|
|
*/
|
|
@JsonInclude(JsonInclude.Include.NON_NULL)
|
|
@Data
|
|
@EqualsAndHashCode(callSuper = false)
|
|
@NoArgsConstructor(access = AccessLevel.PROTECTED) //For Jackson JSON/YAML deserialization
|
|
public abstract class LayerSpace<L extends Layer> extends AbstractParameterSpace<L> {
|
|
protected ParameterSpace<IDropout> dropOut;
|
|
protected int numParameters;
|
|
|
|
protected LayerSpace(Builder builder) {
|
|
this.dropOut = builder.dropOut;
|
|
}
|
|
|
|
@Override
|
|
public List<ParameterSpace> collectLeaves() {
|
|
//To avoid manually coding EVERY parameter, in every layer:
|
|
// Do a depth-first search of nested spaces
|
|
LinkedList<ParameterSpace> stack = new LinkedList<>();
|
|
stack.add(this);
|
|
|
|
List<ParameterSpace> out = new ArrayList<>();
|
|
while (!stack.isEmpty()) {
|
|
ParameterSpace next = stack.removeLast();
|
|
if (next.isLeaf()) {
|
|
out.add(next);
|
|
} else {
|
|
Map<String, ParameterSpace> m = next.getNestedSpaces();
|
|
ParameterSpace[] arr = m.values().toArray(new ParameterSpace[m.size()]);
|
|
for (int i = arr.length - 1; i >= 0; i--) {
|
|
stack.add(arr[i]);
|
|
}
|
|
}
|
|
}
|
|
|
|
return out;
|
|
}
|
|
|
|
@Override
|
|
public int numParameters() {
|
|
return numParameters;
|
|
}
|
|
|
|
@Override
|
|
public boolean isLeaf() {
|
|
return false;
|
|
}
|
|
|
|
@Override
|
|
public void setIndices(int... indices) {
|
|
throw new UnsupportedOperationException("Cannot set indices for non-leaf parameter space");
|
|
}
|
|
|
|
|
|
protected void setLayerOptionsBuilder(Layer.Builder builder, double[] values) {
|
|
if (dropOut != null)
|
|
builder.dropOut(dropOut.getValue(values));
|
|
}
|
|
|
|
|
|
@Override
|
|
public String toString() {
|
|
return toString(", ");
|
|
}
|
|
|
|
protected String toString(String delim) {
|
|
StringBuilder sb = new StringBuilder();
|
|
if (dropOut != null)
|
|
sb.append("dropOut: ").append(dropOut).append(delim);
|
|
String s = sb.toString();
|
|
|
|
if (s.endsWith(delim)) {
|
|
//Remove final delimiter
|
|
int last = s.lastIndexOf(delim);
|
|
return s.substring(0, last);
|
|
} else
|
|
return s;
|
|
}
|
|
|
|
@SuppressWarnings("unchecked")
|
|
public abstract static class Builder<T> {
|
|
protected ParameterSpace<IDropout> dropOut;
|
|
|
|
public T dropOut(double dropOut) {
|
|
return dropOut(new FixedValue<>(dropOut));
|
|
}
|
|
|
|
public T dropOut(ParameterSpace<Double> dropOut) {
|
|
return iDropOut(new DropoutSpace(dropOut));
|
|
}
|
|
|
|
public T iDropOut(ParameterSpace<IDropout> dropOut){
|
|
this.dropOut = dropOut;
|
|
return (T) this;
|
|
}
|
|
|
|
public abstract <E extends LayerSpace> E build();
|
|
}
|
|
|
|
}
|