代码拉取完成,页面将自动刷新
from __future__ import absolute_import
from __future__ import division
from __future__ import print_function
import glob
import logging
import os
from math import inf
import numpy as np
import tensorflow as tf
import config
from data_reading import processors
from data_reading.batcher import Batcher, EvalData
from inference import inference
from model_pools import modeling, model_pools
from utils.metric_utils import calculate_reward
from utils.utils import print_parameters, pprint_params
def create_train_model(hps):
    """Construct the training model selected by ``hps`` and initialise it.

    The model class is looked up in ``model_pools`` by ``hps.model_name``, the
    BERT configuration is read from ``hps.bert_config_file``, and a ``Batcher``
    is built around the processor registered for ``hps.task_name``. After
    construction ``create_or_load_recent_model()`` is called on the model.

    Args:
        hps: Hyper-parameter object. Attributes read here: ``model_name``,
            ``bert_config_file``, ``max_out_seq_length``, ``max_seq_length``,
            ``output_dir``, ``task_name`` and ``learning_rate``.

    Returns:
        The constructed training model.

    Raises:
        ValueError: If ``hps.max_seq_length`` is larger than the (possibly
            enlarged) position-embedding limit, or if no processor is
            registered for the lower-cased task name.
    """
    model_cls = model_pools[hps.model_name]

    bert_config = modeling.BertConfig.from_json_file(hps.bert_config_file)
    # The position table must cover at least twice the maximum output length.
    doubled_out_length = hps.max_out_seq_length * 2
    bert_config.max_position_embeddings = max(bert_config.max_position_embeddings,
                                              doubled_out_length)
    position_limit = bert_config.max_position_embeddings
    if hps.max_seq_length > position_limit:
        template = ('Cannot use sequence length %d because the BERT model '
                    'was only trained up to sequence length %d')
        raise ValueError(template % (hps.max_seq_length, position_limit))

    tf.gfile.MakeDirs(hps.output_dir)

    # Resolve the task-specific processor from the lower-cased task name.
    task_key = hps.task_name.lower()
    if task_key not in processors:
        raise ValueError('Task not found: %s' % task_key)
    processor = processors[task_key](hps)
    print('processor!!!!', processor)
    train_batcher = Batcher(processor, hps)

    print("create trainning model...")
    train_model = model_cls(bert_config, train_batcher, hps)
    train_model.create_or_load_recent_model()

    steps_message = 'Total train steps: {}, total warm_up steps: {}...'.format(
        train_model.num_train_steps, train_model.num_warmup_steps)
    logging.info(steps_message)

    current_lr = train_model.load_specific_variable(train_model.cur_lr)
    logging.info('Init lr: {}, current lr: {}'.format(hps.learning_rate, current_lr))

    print("create trainning model done")
    return train_model
def create_eval_model(hps):
    """Construct the evaluation model and list the checkpoints to evaluate.

    Mirrors the training-model setup (model class from ``model_pools``, BERT
    config from ``hps.bert_config_file``, processor from ``hps.task_name``)
    but forces ``hps.mode`` to ``'dev'`` before building the ``Batcher``.

    Args:
        hps: Hyper-parameter object. Attributes read here: ``model_name``,
            ``bert_config_file``, ``max_out_seq_length``, ``max_seq_length``,
            ``output_dir`` and ``task_name``. ``hps.mode`` is overwritten
            with ``'dev'`` as a side effect.

    Returns:
        A ``(model, all_ckpt)`` tuple where ``all_ckpt`` holds one path per
        ``*.index`` file found in ``hps.output_dir``, with only the trailing
        ``.index`` extension removed.

    Raises:
        ValueError: If ``hps.max_seq_length`` is larger than the (possibly
            enlarged) position-embedding limit, or if no processor is
            registered for the lower-cased task name.
    """
    model_cls = model_pools[hps.model_name]
    bert_config = modeling.BertConfig.from_json_file(hps.bert_config_file)
    bert_config.max_position_embeddings = max(bert_config.max_position_embeddings,
                                              hps.max_out_seq_length * 2)
    if hps.max_seq_length > bert_config.max_position_embeddings:
        raise ValueError(
            'Cannot use sequence length %d because the BERT model '
            'was only trained up to sequence length %d' %
            (hps.max_seq_length, bert_config.max_position_embeddings))

    tf.gfile.MakeDirs(hps.output_dir)

    task_name = hps.task_name.lower()
    if task_name not in processors:
        raise ValueError('Task not found: %s' % task_name)
    processor = processors[task_name](hps)

    hps.mode = 'dev'  # use dev set to choose best model
    batcher = Batcher(processor, hps)

    # create eval model
    print("create eval model...")
    model = model_cls(bert_config, batcher, hps)

    # Strip only the final ".index" extension. Splitting on the first "." of
    # the whole path breaks for directories such as "./out" or checkpoint
    # names that themselves contain a dot.
    index_pattern = os.path.join(hps.output_dir, '*.index')
    all_ckpt = [os.path.splitext(index_file)[0] for index_file in glob.glob(index_pattern)]

    print("create eval model done")
    return model, all_ckpt
def _next_training_batch(bert_model, hps, feed_draft, run_reward):
    """Fetch the next batch and attach its draft flag and, if enabled, its reward."""
    batch = bert_model.batcher.next_batch()
    # Builtin ``bool`` replaces the ``np.bool`` alias, which newer NumPy removed.
    batch.feed_draft = np.array(feed_draft, dtype=bool)
    if run_reward:
        batch_pred_ids = bert_model.run_reward(batch)['pred_ids']  # [b, length]
        batch.reward = calculate_reward(batch_pred_ids, batch, hps.padId)
    return batch


def train(hps):
    """Run the training loop for the model described by ``hps``.

    Each step runs ``hps.accumulate_step - 1`` gradient-accumulation batches
    followed by one final batch that is passed to ``run_train_step``. Every
    100 steps the average loss is logged and, if it rose by more than 0.5
    over the previous 100-step average, ``create_or_load_recent_model()`` is
    called again. A checkpoint is written whenever
    ``step % hps.evaluate_every_n_step == 0`` and once more after the loop.

    Args:
        hps: Hyper-parameter object. Besides what ``create_train_model``
            reads, this function uses ``output_dir``, ``model_name``,
            ``debug``, ``start_portion_to_feed_draft``, ``draft_feed_freq``,
            ``accumulate_step``, ``padId`` and ``evaluate_every_n_step``.
    """
    bert_model = create_train_model(hps)
    checkpoint_basename = os.path.join(hps.output_dir, hps.model_name)
    logging.info(checkpoint_basename)
    bert_model.save_model(checkpoint_basename)

    start_step = bert_model.load_specific_variable(bert_model.global_step)
    if start_step == 0:
        print_parameters(bert_model.graph, output_detail=True, output_to_logging=True)
    if hps.debug and start_step == 0:
        # figure out how many GPU memory used
        batch = bert_model.batcher.next_batch()
        bert_model.figure_out_memory_usage(batch)

    print('Start training ...')
    avg_loss = []
    # Reward computation is optional: only models exposing run_reward() use it.
    run_reward = hasattr(bert_model, 'run_reward') and callable(bert_model.run_reward)
    former_loss = inf
    for step in range(start_step, bert_model.num_train_steps):
        # feed draft or ground-truth
        feed_draft = (step > hps.start_portion_to_feed_draft * bert_model.num_train_steps
                      and step % hps.draft_feed_freq == 0)

        for _ in range(hps.accumulate_step - 1):  # gradient accumulation
            batch = _next_training_batch(bert_model, hps, feed_draft, run_reward)
            bert_model.run_grad_accum_step(batch)
            batch.reward = None

        batch = _next_training_batch(bert_model, hps, feed_draft, run_reward)
        # NOTE(review): the final batch is accumulated and has its reward
        # cleared before run_train_step(), exactly as in the original
        # statement order -- confirm this is intended.
        bert_model.run_grad_accum_step(batch)
        batch.reward = None
        results = bert_model.run_train_step(batch)

        avg_loss.append(results['loss'])
        bert_model.summary_writer.add_summary(results['summaries'], step)

        if step % 100 == 0:
            # avg_loss is never empty here: a loss was appended just above.
            this_loss = sum(avg_loss) / len(avg_loss)
            if this_loss > former_loss and this_loss - former_loss > 0.5:
                bert_model.create_or_load_recent_model()
                logging.info('former loss:{}, this loss"{}, reload'.format(former_loss, this_loss))
            former_loss = this_loss
            logging.info('step {}, 100 steps avg loss: {}\n'.format(step, this_loss))
            avg_loss = []
            bert_model.summary_writer.flush()

        if step % hps.evaluate_every_n_step == 0:
            bert_model.save_model(checkpoint_basename, with_step=True)

    bert_model.save_model(checkpoint_basename, with_step=True)
def eval_best_ckpt(hps):
    """Evaluate every checkpoint on the dev data and re-save the best one.

    For each checkpoint returned by ``create_eval_model`` the model is loaded,
    the evaluation data is iterated from the start, and the mean of the
    per-batch ``'loss'`` values from ``run_dev_step`` is computed. Batches
    whose first dimension differs from ``hps.eval_batch_size`` are skipped.
    The checkpoint with the lowest mean loss is reloaded and saved under
    ``<output_dir>/<model_name>best``.

    Args:
        hps: Hyper-parameter object. Besides what ``create_eval_model`` reads,
            this function uses ``output_dir``, ``model_name``,
            ``eval_batch_size`` and ``padId``.

    Raises:
        ValueError: If no checkpoint produced a usable dev loss (for example
            when the output directory holds no checkpoints).
    """
    checkpoint_basename = os.path.join(hps.output_dir, hps.model_name)
    eval_model, all_ckpt = create_eval_model(hps)
    best_eval_loss, best_ckpt = inf, None
    batcher = EvalData(hps)
    # Reward computation is optional: only models exposing run_reward() use it.
    run_reward = hasattr(eval_model, 'run_reward') and callable(eval_model.run_reward)

    for each_ckpt in all_ckpt:
        logging.info('Start evaluate performance of ckpt: {}'.format(each_ckpt))
        batcher.restart()
        eval_model.load_specific_model(each_ckpt)
        loss_all = []
        step = 0
        while True:
            batch = batcher.next_batch()
            step += 1
            if batch is None:
                break
            # Builtin ``bool`` replaces the ``np.bool`` alias, which newer NumPy removed.
            batch.feed_draft = np.array(True, dtype=bool)
            if batch.source_ids.shape[0] != hps.eval_batch_size:
                logging.warning('Purge {} samples, '
                                'as sample num != eval_batch_size ({})'.format(batch.source_ids.shape[0],
                                                                               hps.eval_batch_size))
                continue
            # Guard on loss_all: every batch so far may have been purged.
            if step % 100 == 0 and loss_all:
                logging.info('step {}, avg loss: {}\n'.format(step, sum(loss_all) / len(loss_all)))
            if run_reward:
                batch_pred_ids = eval_model.run_reward(batch)['pred_ids']  # [b, length]
                batch.reward = calculate_reward(batch_pred_ids, batch, hps.padId)
            results = eval_model.run_dev_step(batch)
            loss_all.append(results['loss'])

        if not loss_all:
            # Averaging an empty list would yield NaN; such a checkpoint can
            # never be selected, so skip it explicitly.
            logging.warning('ckpt: {}, no batch was evaluated, skipped'.format(each_ckpt))
            continue

        loss = np.average(loss_all)
        if loss < best_eval_loss:
            best_eval_loss = loss
            best_ckpt = each_ckpt
        logging.info('ckpt: {}, dev loss: {}, best loss: {}'.format(each_ckpt, loss, best_eval_loss))

    if best_ckpt is None:
        raise ValueError('No checkpoint could be evaluated in: %s' % hps.output_dir)

    # load and save best model
    eval_model.load_specific_model(best_ckpt)
    eval_model.save_model(checkpoint_basename + 'best', True)
def main(_):
    """Parse the configuration, set up logging and dispatch on ``FLAGS.mode``.

    ``train_batch_size`` is multiplied by ``len(FLAGS.gpu)`` and
    ``accumulate_step`` is multiplied by ``int(4 / len(FLAGS.gpu))`` before
    anything else runs. Logging goes to ``FLAGS.log_file`` (appended, UTF-8)
    when that flag is set, otherwise to the default ``basicConfig`` handler.

    Args:
        _: Unused positional argument supplied by the caller.

    Raises:
        ValueError: If ``FLAGS.mode`` is not one of train/eval/dev/test.
    """
    FLAGS = config.parse_args()
    FLAGS.train_batch_size = int(len(FLAGS.gpu) * FLAGS.train_batch_size)
    print('orign_accu', FLAGS.accumulate_step)
    # NOTE(review): 4 looks like a reference device count used to rescale the
    # accumulation steps; an empty FLAGS.gpu would divide by zero -- confirm.
    FLAGS.accumulate_step = int(int(4 / len(FLAGS.gpu)) * FLAGS.accumulate_step)
    print('Num_GPUS', len(FLAGS.gpu))
    print('batch_size', FLAGS.train_batch_size)
    print('accumulate_step', FLAGS.accumulate_step)

    basic_format = '%(asctime)s - %(name)s - %(levelname)s - %(message)s'
    formatter = logging.Formatter(basic_format)
    if FLAGS.log_file:
        # dirname is '' for a bare file name; os.makedirs('') would raise, so
        # only create the directory when there is one to create.
        log_dir = os.path.dirname(FLAGS.log_file)
        if log_dir:
            os.makedirs(log_dir, exist_ok=True)
        handler = logging.FileHandler(FLAGS.log_file, 'a', 'utf-8')
        handler.setFormatter(formatter)
        handlers = [handler]
    else:
        handlers = None
    logging.basicConfig(level=logging.INFO,
                        format=basic_format,
                        handlers=handlers)

    logging.info('-' * 80 + '[' + FLAGS.mode + ']' + '-' * 80)
    logging.info('Starting seq2seq_attention in %s mode...', FLAGS.mode)
    logging.info(pprint_params(FLAGS))

    if FLAGS.mode == 'train':
        train(FLAGS)
    elif FLAGS.mode == 'eval':
        eval_best_ckpt(FLAGS)
    elif FLAGS.mode in ('dev', 'test'):
        inference(FLAGS)
    else:
        # The message now lists every mode the dispatch above accepts.
        raise ValueError('The `mode` flag must be one of train/eval/dev/test')
# Script entry point. tf.app.run() is called without arguments; per the
# TensorFlow 1.x documentation it is expected to invoke this module's
# main(argv) -- confirm against the installed TensorFlow version.
if __name__ == '__main__':
    tf.app.run()
此处可能存在不合适展示的内容,页面不予展示。您可通过相关编辑功能自查并修改。
如您确认内容无涉及 不当用语 / 纯广告导流 / 暴力 / 低俗色情 / 侵权 / 盗版 / 虚假 / 无价值内容或违法国家有关法律法规的内容,可点击提交进行申诉,我们将尽快为您处理。