print('WARNING: nan loss detected, ending training')
returnresults
# Divide by accumulation count
ifaccumulate>1:
loss/=accumulate
# Scale loss by nominal batch_size of 64
loss*=batch_size/64
# Compute gradient
ifmixed_precision:
Reference in New Issue
Block a user
Blocking a user prevents them from interacting with repositories, such as opening or commenting on pull requests or issues. Learn more about blocking a user.