2017-03-29 13:44:02 +00:00
|
|
|
## @package layer_model_instantiator
|
|
|
|
|
# Module caffe2.python.layer_model_instantiator
|
2020-09-24 00:55:24 +00:00
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
2016-11-14 22:58:04 +00:00
|
|
|
|
2017-05-25 07:10:48 +00:00
|
|
|
from caffe2.python import core, schema
|
2016-11-14 22:58:04 +00:00
|
|
|
from caffe2.python.layers.layers import InstantiationContext
|
|
|
|
|
from caffe2.python.layers.tags import Tags
|
|
|
|
|
|
|
|
|
|
|
2017-04-17 21:02:44 +00:00
|
|
|
def _filter_layers(layers, include_tags):
|
|
|
|
|
if include_tags is None:
|
|
|
|
|
return layers
|
|
|
|
|
include_tags = set(include_tags)
|
2017-05-30 22:29:57 +00:00
|
|
|
return [l for l in layers if not include_tags.isdisjoint(l.tags)]
|
2017-04-17 21:02:44 +00:00
|
|
|
|
|
|
|
|
|
2017-05-25 07:10:48 +00:00
|
|
|
def shrink_output_schema(net, out_schema):
|
|
|
|
|
if len(out_schema.field_names()) <= 1:
|
|
|
|
|
return out_schema
|
|
|
|
|
exists = [net.BlobIsDefined(blob) for blob in out_schema.field_blobs()]
|
|
|
|
|
return schema.from_column_list(
|
|
|
|
|
[
|
|
|
|
|
col_name for ok, col_name in
|
|
|
|
|
zip(exists, out_schema.field_names()) if ok
|
|
|
|
|
],
|
|
|
|
|
[
|
|
|
|
|
col_type for ok, col_type in
|
|
|
|
|
zip(exists, out_schema.field_types()) if ok
|
|
|
|
|
],
|
|
|
|
|
[
|
|
|
|
|
col_blob for ok, col_blob in
|
|
|
|
|
zip(exists, out_schema.field_blobs()) if ok
|
|
|
|
|
],
|
|
|
|
|
[
|
|
|
|
|
col_meta for ok, col_meta in
|
|
|
|
|
zip(exists, out_schema.field_metadata()) if ok
|
|
|
|
|
]
|
|
|
|
|
)
|
|
|
|
|
|
|
|
|
|
|
2017-04-17 21:02:44 +00:00
|
|
|
def generate_predict_net(model, include_tags=None):
|
2016-11-14 22:58:04 +00:00
|
|
|
predict_net = core.Net('predict_net')
|
|
|
|
|
|
2017-04-17 21:02:44 +00:00
|
|
|
for layer in _filter_layers(model.layers, include_tags):
|
2017-05-02 16:27:21 +00:00
|
|
|
if Tags.EXCLUDE_FROM_PREDICTION not in layer.tags:
|
2016-11-14 22:58:04 +00:00
|
|
|
layer.add_operators(
|
|
|
|
|
predict_net, context=InstantiationContext.PREDICTION)
|
2017-05-03 00:22:16 +00:00
|
|
|
|
|
|
|
|
predict_net.set_input_record(model.input_feature_schema.clone())
|
2017-05-25 07:10:48 +00:00
|
|
|
output_schema = shrink_output_schema(
|
|
|
|
|
predict_net, model.output_schema.clone()
|
|
|
|
|
)
|
|
|
|
|
predict_net.set_output_record(output_schema)
|
2016-11-14 22:58:04 +00:00
|
|
|
return predict_net
|
|
|
|
|
|
|
|
|
|
|
2017-04-17 21:02:44 +00:00
|
|
|
def generate_eval_net(model, include_tags=None):
|
2017-03-08 04:57:39 +00:00
|
|
|
eval_net = core.Net('eval_net')
|
|
|
|
|
|
2017-04-17 21:02:44 +00:00
|
|
|
for layer in _filter_layers(model.layers, include_tags):
|
2017-05-02 16:27:21 +00:00
|
|
|
if Tags.EXCLUDE_FROM_EVAL not in layer.tags:
|
|
|
|
|
layer.add_operators(eval_net, context=InstantiationContext.EVAL)
|
2017-03-08 04:57:39 +00:00
|
|
|
|
|
|
|
|
input_schema = model.input_feature_schema + model.trainer_extra_schema
|
|
|
|
|
eval_net.set_input_record(input_schema)
|
2017-05-25 07:10:48 +00:00
|
|
|
output_schema = shrink_output_schema(
|
|
|
|
|
eval_net, model.output_schema + model.metrics_schema
|
|
|
|
|
)
|
2017-03-08 04:57:39 +00:00
|
|
|
eval_net.set_output_record(output_schema)
|
|
|
|
|
return eval_net
|
|
|
|
|
|
|
|
|
|
|
2017-04-17 21:02:44 +00:00
|
|
|
def _generate_training_net_only(model, include_tags=None):
|
2016-11-14 22:58:04 +00:00
|
|
|
train_net = core.Net('train_net')
|
|
|
|
|
train_init_net = model.create_init_net('train_init_net')
|
|
|
|
|
|
2017-04-17 21:02:44 +00:00
|
|
|
for layer in _filter_layers(model.layers, include_tags):
|
2017-05-02 16:27:21 +00:00
|
|
|
if Tags.EXCLUDE_FROM_TRAIN not in layer.tags:
|
|
|
|
|
layer.add_operators(train_net, train_init_net)
|
2017-03-09 07:45:31 +00:00
|
|
|
|
|
|
|
|
input_schema = model.input_feature_schema + model.trainer_extra_schema
|
|
|
|
|
train_net.set_input_record(input_schema)
|
2017-05-25 07:10:48 +00:00
|
|
|
output_schema = shrink_output_schema(
|
|
|
|
|
train_net, model.output_schema + model.metrics_schema
|
|
|
|
|
)
|
2017-03-09 07:45:31 +00:00
|
|
|
train_net.set_output_record(output_schema)
|
2017-02-07 20:56:58 +00:00
|
|
|
return train_init_net, train_net
|
|
|
|
|
|
|
|
|
|
|
2017-04-17 21:02:44 +00:00
|
|
|
def generate_training_nets_forward_only(model, include_tags=None):
|
|
|
|
|
train_init_net, train_net = _generate_training_net_only(model, include_tags)
|
2017-02-07 20:56:58 +00:00
|
|
|
return train_init_net, train_net
|
|
|
|
|
|
|
|
|
|
|
2017-04-17 21:02:44 +00:00
|
|
|
def generate_training_nets(model, include_tags=None):
|
|
|
|
|
train_init_net, train_net = _generate_training_net_only(model, include_tags)
|
2017-02-07 20:56:58 +00:00
|
|
|
|
2018-01-08 20:58:21 +00:00
|
|
|
model.apply_regularizers_on_loss(train_net, train_init_net)
|
2018-03-26 18:10:47 +00:00
|
|
|
if not model.has_loss():
|
|
|
|
|
return train_init_net, train_net
|
2017-02-07 20:56:58 +00:00
|
|
|
loss = model.loss
|
2016-11-14 22:58:04 +00:00
|
|
|
grad_map = train_net.AddGradientOperators(loss.field_blobs())
|
2018-04-02 23:35:27 +00:00
|
|
|
model.apply_post_grad_net_modifiers(train_net, train_init_net, grad_map,
|
|
|
|
|
modify_output_record=True)
|
2017-03-25 05:09:30 +00:00
|
|
|
model.apply_optimizers(train_net, train_init_net, grad_map)
|
2018-01-08 20:58:21 +00:00
|
|
|
model.apply_regularizers_after_optimizer(train_net, train_init_net, grad_map)
|
2018-04-02 23:35:27 +00:00
|
|
|
model.apply_final_net_modifiers(train_net, train_init_net, grad_map,
|
|
|
|
|
modify_output_record=True)
|
2018-03-08 21:41:32 +00:00
|
|
|
|
2016-11-14 22:58:04 +00:00
|
|
|
return train_init_net, train_net
|