# Collect the names of all parameters of `model` whose `.grad` attribute is None.
# NOTE(review): presumably evaluated interactively (REPL/debugger) after a backward
# pass to spot parameters that received no gradient -- confirm against actual usage.
# `is None` is used instead of `== None`: an identity check cannot be intercepted by
# an overloaded `__eq__` on the `.grad` object, so the filter always sees a plain bool.
[name for name, param in model.named_parameters() if param.grad is None]
# Run train.sh under bash with TORCH_DISTRIBUTED_DEBUG=DETAIL set for that child
# process only; the variable is not left behind in the invoking shell.
# NOTE(review): per the PyTorch distributed docs, DETAIL is the most verbose debug
# level -- confirm the exact effect for the installed PyTorch version.
env TORCH_DISTRIBUTED_DEBUG=DETAIL bash train.sh