# Licensed to the Apache Software Foundation (ASF) under one
# or more contributor license agreements. See the NOTICE file
# distributed with this work for additional information
# regarding copyright ownership. The ASF licenses this file
# to you under the Apache License, Version 2.0 (the
# "License"); you may not use this file except in compliance
# with the License. You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing,
# software distributed under the License is distributed on an
# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
# KIND, either express or implied. See the License for the
# specific language governing permissions and limitations
# under the License.
from __future__ import division
import argparse
import logging
import time
import numpy as np
from bottleneck import argpartition
import mxnet as mx
from data import cub200_iterator
from mxnet import gluon
from mxnet.gluon.model_zoo import vision as models
from mxnet import autograd as ag, nd
from model import MarginNet, MarginLoss
logging.basicConfig(level=logging.INFO)

# CLI
# Every option has a default, so the script can be launched with no arguments.
parser = argparse.ArgumentParser(description='train a model for image classification.')
# Raw string: the Windows-style default contains "\W" and "\D", which are
# invalid escape sequences in an ordinary string literal. The runtime value
# is unchanged.
parser.add_argument('--data-path', type=str, default=r'D:\Work\Data/valid1',
                    help='path of data.')
parser.add_argument('--embed-dim', type=int, default=128,
                    help='dimensionality of image embedding. default is 128.')
parser.add_argument('--batch-size', type=int, default=70,
                    help='training batch size per device (CPU/GPU). default is 70.')
parser.add_argument('--batch-k', type=int, default=5,
                    help='number of images per class in a batch. default is 5.')
parser.add_argument('--gpus', type=str, default='',
                    help='list of gpus to use, e.g. 0 or 0,2,5. empty means using cpu.')
parser.add_argument('--epochs', type=int, default=20,
                    help='number of training epochs. default is 20.')
parser.add_argument('--optimizer', type=str, default='adam',
                    help='optimizer. default is adam.')
parser.add_argument('--lr', type=float, default=0.0001,
                    help='learning rate. default is 0.0001.')
parser.add_argument('--lr-beta', type=float, default=0.1,
                    help='learning rate for the beta in margin based loss. default is 0.1.')
parser.add_argument('--margin', type=float, default=0.2,
                    help='margin for the margin based loss. default is 0.2.')
parser.add_argument('--beta', type=float, default=1.2,
                    help='initial value for beta. default is 1.2.')
parser.add_argument('--nu', type=float, default=0.0,
                    help='regularization parameter for beta. default is 0.0.')
parser.add_argument('--factor', type=float, default=0.5,
                    help='learning rate schedule factor. default is 0.5.')
parser.add_argument('--steps', type=str, default='12,14,16,18',
                    help='epochs to update learning rate. default is 12,14,16,18.')
parser.add_argument('--wd', type=float, default=0.0001,
                    help='weight decay rate. default is 0.0001.')
parser.add_argument('--seed', type=int, default=123,
                    help='random seed to use. default=123.')
parser.add_argument('--model', type=str, default='resnet50_v2',
                    help='type of model to use. see vision_model for options.')
parser.add_argument('--save-model-prefix', type=str, default='margin_loss_model',
                    help='prefix of models to be saved.')
parser.add_argument('--use-pretrained', action='store_true',
                    help='enable using pretrained model from gluon.')
parser.add_argument('--kvstore', type=str, default='device',
                    help='kvstore to use for trainer.')
parser.add_argument('--log-interval', type=int, default=20,
                    help='number of batches to wait before logging.')
opt = parser.parse_args()
logging.info(opt)

# Settings.
# Seed both the MXNet and NumPy random generators from the same --seed value.
mx.random.seed(opt.seed)
np.random.seed(opt.seed)

# --gpus is a comma-separated list of device ids; None or '' selects the CPU.
# Test truthiness rather than `is ''`: identity against a string literal only
# works when the interpreter happens to intern the value, and otherwise
# int('') would raise ValueError below.
gpus = [int(gpu) for gpu in opt.gpus.split(',')] if opt.gpus else []
num_gpus = len(gpus)
# --batch-size is given per device, so scale it by the device count (min. 1).
batch_size = opt.batch_size * max(1, num_gpus)
context = [mx.gpu(i) for i in gpus] if num_gpus > 0 else [mx.cpu()]
# Epoch indices parsed from the comma-separated --steps option.
steps = [int(step) for step in opt.steps.split(',')]
# Construct model.
# Backbone comes from the Gluon model zoo, placed on the selected devices.
kwargs = dict(ctx=context, pretrained=opt.use_pretrained)
net = models.get_model(opt.model, **kwargs)

if opt.use_pretrained:
    # Use a smaller learning rate for pre-trained convolutional layers
    # (every parameter whose name contains 'conv').
    for v in net.collect_params().values():
        if 'conv' in v.name:
            v.lr_mult = 0.01

net.hybridize()
# Re-wrap only the backbone's `features` sub-block in the project's MarginNet.
net = MarginNet(net.features, opt.embed_dim, opt.batch_k)
# NOTE(review): shape (100,) is presumably one beta per training class
# (train() calls it "class-specific beta") - confirm against the dataset.
beta = mx.gluon.Parameter('beta', shape=(100,))

# Get iterators.
train_data, val_data = cub200_iterator(
    opt.data_path, opt.batch_k, batch_size, (3, 224, 224))
def get_distance_matrix(x):
    """Get distance matrix given a matrix. Used in testing.

    Uses the expansion ||a - b||^2 = ||a||^2 + ||b||^2 - 2 * a.b applied to
    every pair of rows of ``x``.

    Parameters
    ----------
    x : NDArray
        2-D array whose rows are the vectors to compare (the squared norm is
        reduced over axis 1).

    Returns
    -------
    NDArray
        Square matrix whose entry (i, j) is the Euclidean distance between
        row i and row j of ``x``.
    """
    square = nd.sum(x ** 2.0, axis=1, keepdims=True)
    distance_square = square + square.transpose() - (2.0 * nd.dot(x, x.transpose()))
    # Floating-point cancellation can leave a true zero (e.g. the diagonal or
    # duplicate rows) slightly negative; sqrt would then return NaN and break
    # the nearest-neighbour ranking. Clamp at zero before taking the root.
    return nd.sqrt(nd.maximum(distance_square, 0.0))
def evaluate_emb(emb, labels):
    """Score embeddings with Recall@k for k in 1, 2, 4, 8 and 16.

    A sample counts as a hit at k when at least one of its k nearest
    neighbours (itself excluded) carries the same label.

    Parameters
    ----------
    emb : NDArray
        Embeddings, one row per sample.
    labels : NDArray
        Labels, indexed in the same order as the rows of ``emb``.

    Returns
    -------
    (list of str, list of float)
        Metric names ('Recall@1', ...) and the matching hit ratios.
    """
    dist = get_distance_matrix(emb).asnumpy()
    label_arr = labels.asnumpy()
    num_samples = emb.shape[0]

    # Push self-distances far away so a sample is never its own neighbour.
    np.fill_diagonal(dist, 1e10)

    names, accs = [], []
    for k in (1, 2, 4, 8, 16):
        names.append('Recall@%d' % k)
        hits = 0.0
        for row in range(num_samples):
            # The first k entries of the partition are the k closest samples.
            neighbours = argpartition(dist[row], k)[:k]
            if any(label_arr[row] == label_arr[nn] for nn in neighbours):
                hits += 1
        accs.append(hits / float(num_samples))
    return names, accs
def test(ctx):
    """Embed the validation set and report Recall@k.

    Parameters
    ----------
    ctx : list of Context
        Devices each validation batch is split across.

    Returns
    -------
    Whatever ``evaluate_emb`` returns for the collected embeddings and labels.
    """
    val_data.reset()
    embeddings, targets = [], []
    for batch in val_data:
        data_parts = gluon.utils.split_and_load(batch.data[0], ctx_list=ctx, batch_axis=0)
        label_parts = gluon.utils.split_and_load(batch.label[0], ctx_list=ctx, batch_axis=0)
        # Only the last element of the network output is kept as the embedding.
        embeddings.extend(net(part)[-1] for part in data_parts)
        targets.extend(label_parts)

    # Keep only the first n_test rows.
    # NOTE(review): presumably this drops padding from the final batch - confirm.
    n_test = val_data.n_test
    embeddings = nd.concatenate(embeddings, axis=0)[:n_test]
    targets = nd.concatenate(targets, axis=0)[:n_test]
    return evaluate_emb(embeddings, targets)
def get_lr(lr, epoch, steps, factor):
    """Return the learning rate in effect at ``epoch``.

    The base rate ``lr`` is multiplied by ``factor`` once for every entry of
    ``steps`` that ``epoch`` has reached (``epoch >= step``).
    """
    reached = [milestone for milestone in steps if epoch >= milestone]
    for _ in reached:
        lr = lr * factor
    return lr
def train(epochs, ctx):
"""Training function."""
if isinstance(ctx, mx.Context):
ctx = [ctx]
net.initialize(mx.init.Xavier(magnitude=2), ctx=ctx)
opt_options = {'learning_rate': opt.lr, 'wd': opt.wd}
if opt.optimizer == 'sgd':
opt_options['momentum'] = 0.9
if opt.optimizer == 'adam':
opt_options['epsilon'] = 1e-7
trainer = gluon.Trainer(net.collect_params(), opt.optimizer,
opt_options,
kvstore=opt.kvstore)
if opt.lr_beta > 0.0:
# Jointly train class-specific beta.
# See "sampling matters in deep embedding learning" paper for details.
beta.initialize(mx.init.Constant(opt.beta), ctx=ctx)
trainer_beta = gluon.Trainer([beta], 'sgd',
{'learning_rate': opt.lr_beta, 'momentum': 0.9},
kvstore=opt.kvstore)
loss = MarginLoss(margin=opt.margin, nu=opt.nu)
best_val = 0.0
for epoch in range(epochs):
tic = time.time()
prev_loss, cumulative_loss = 0.0, 0.0
# Learning rate schedule.
trainer.set_learning_rate(get_lr(opt.lr, epoch, steps, opt.factor))
logging.info('Epoch %d learning rate=%f', epoch, trainer.learning_rate)
if opt.lr_beta > 0.0:
trainer_beta.set_learning_rate(get_lr(opt.
weixin_42653672
- 粉丝: 110
- 资源: 1万+
最新资源
- 小数分频锁相环,环形振荡器结构,smic28nm,有版图,有很多设计原理ppt文档等
- langchain的详解与应用
- 基于VSG控制(同步发电机控制)的模块化多电平变流器MMC 通过设置可编程电源,模拟电网频率和电压改变, 观测MMC输出功率的变化情况 初步设定值电网线电压U=10kV;Pref=10e6;Qref=
- 永磁同步电机旋转高频信号注入法零低速无位置控制仿真,相比高频方波信号注入法,旋转高频信号注入法噪声更小损耗更低
- 在MySQL中使用查询扩展的全文搜索和全文搜索停用词.pdf
- simulink光伏并同步发电机,光伏减载,留出备用进行频率惯量支撑,减小对同步发电机的依赖 频率支撑效果好,波形效果好,非一般仿真 可以改变光强,温度以及减载率
- 机械设计PCB自动清洗线step非常好的设计图纸100%好用.zip
- Qt CPP实现的多列时间轴控件、可与多段字符串格式自由转、也可手动添加列表项、专门用来以时间轴作为事件线发展顺序的故事大纲 时间可输入任意内容,不限于时间,每一时间段允许多列,即多个文字节点,行与
- 类和对象资料学习文档备份
- 构网变流器功率控制控制(dq坐标系) 1)dq旋转坐标系下实现下垂控制; 2)无功下垂采用比例积分控制,能够实现功率准确、快速无静差跟踪; 3)采用电压电流双闭环、电压前馈实现准确电压跟踪
- 模型预测控制(MPC)+路径跟踪(PTC)+侧偏角软约束+主动前轮转向(AFS),目前的范例是72km h,附着系数0.3的单移线,附着系数0.85双移线 仿真使用的是MATLAB2020b版本和c
- 机械设计布料拉平裁切机sw18可编辑非常好的设计图纸100%好用.zip
- Python的安装及运行PDF
- 非线性七自由度车辆simulink模型,基于魔术公式,同时提供二,三自由度车辆模型,发整套 汽车操作稳定性模型,考虑四个车轮转动,考虑汽车侧向纵向运动 提供,参考lunwen 提供二自由度车辆动
- 无线充电仿真 simulink 磁耦合谐振 无线电能传输 MCR WPT lcc ss llc拓扑补偿 一共四套模型: 1.llc谐振器实现12 24V恒压输出 带调频控制 附参考文献和讲解视频
- 机械设计齿轮箱滚珠模块装配step非常好的设计图纸100%好用.zip
资源上传下载、课程学习等过程中有任何疑问或建议,欢迎提出宝贵意见哦~我们会及时处理!
点击此处反馈
评论0