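# Python: names of the parameters whose .grad is None
[name for name,para in model.named_parameters() if para.grad==None]

# Shell: run train.sh with TORCH_DISTRIBUTED_DEBUG=DETAIL set in its environment
TORCH_DISTRIBUTED_DEBUG=DETAIL bash train.sh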