# adam_test1.py (613 B)

  1. # Copyright (c) Microsoft Corporation.
  2. # SPDX-License-Identifier: Apache-2.0
  3. # DeepSpeed Team
  4. import torch
  5. from deepspeed.ops.adam import DeepSpeedCPUAdam
  6. import time
  7. device = 'cpu'
  8. model_size = 1 * 1024**3
  9. param = torch.nn.Parameter(torch.ones(model_size, device=device))
  10. optimizer = DeepSpeedCPUAdam([param])
  11. #torch.set_num_threads(128)
  12. param.grad = torch.ones(model_size, device=device)
  13. avg = 0
  14. for i in range(100):
  15. start = time.time()
  16. optimizer.step()
  17. stop = time.time()
  18. avg += (stop - start)
  19. param.grad = torch.ones(model_size, device=device) * 2
  20. print("Elapsed Time is ", avg / 100)