..
    Copyright (c) 2022-2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.

    See LICENSE for license information.

PyTorch
=======

.. autoapiclass:: transformer_engine.pytorch.Linear(in_features, out_features, bias=True, **kwargs)
  :members: forward, set_tensor_parallel_group

.. autoapiclass:: transformer_engine.pytorch.GroupedLinear(in_features, out_features, bias=True, **kwargs)
  :members: forward, set_tensor_parallel_group

.. autoapiclass:: transformer_engine.pytorch.LayerNorm(hidden_size, eps=1e-5, **kwargs)

.. autoapiclass:: transformer_engine.pytorch.RMSNorm(hidden_size, eps=1e-5, **kwargs)

.. autoapiclass:: transformer_engine.pytorch.LayerNormLinear(in_features, out_features, eps=1e-5, bias=True, **kwargs)
  :members: forward, set_tensor_parallel_group

.. autoapiclass:: transformer_engine.pytorch.LayerNormMLP(hidden_size, ffn_hidden_size, eps=1e-5, bias=True, **kwargs)
  :members: forward, set_tensor_parallel_group

.. autoapiclass:: transformer_engine.pytorch.DotProductAttention(num_attention_heads, kv_channels, **kwargs)
  :members: forward, set_context_parallel_group

.. autoapiclass:: transformer_engine.pytorch.MultiheadAttention(hidden_size, num_attention_heads, **kwargs)
  :members: forward, set_context_parallel_group, set_tensor_parallel_group

.. autoapiclass:: transformer_engine.pytorch.TransformerLayer(hidden_size, ffn_hidden_size, num_attention_heads, **kwargs)
  :members: forward, set_context_parallel_group, set_tensor_parallel_group

.. autoapiclass:: transformer_engine.pytorch.InferenceParams(max_batch_size, max_sequence_length)

.. autoapiclass:: transformer_engine.pytorch.CudaRNGStatesTracker()
  :members: reset, get_states, set_states, add, fork

.. autoapifunction:: transformer_engine.pytorch.fp8_autocast

.. autoapifunction:: transformer_engine.pytorch.fp8_model_init

.. autoapifunction:: transformer_engine.pytorch.checkpoint

.. autoapifunction:: transformer_engine.pytorch.make_graphed_callables

.. autoapifunction:: transformer_engine.pytorch.get_cpu_offload_context

.. autoapifunction:: transformer_engine.pytorch.moe_permute

.. autoapifunction:: transformer_engine.pytorch.moe_permute_with_probs

.. autoapifunction:: transformer_engine.pytorch.moe_unpermute

.. autoapifunction:: transformer_engine.pytorch.moe_sort_chunks_by_index

.. autoapifunction:: transformer_engine.pytorch.parallel_cross_entropy

.. autoapifunction:: transformer_engine.pytorch.moe_sort_chunks_by_index_with_probs

.. autoapifunction:: transformer_engine.pytorch.initialize_ub

.. autoapifunction:: transformer_engine.pytorch.destroy_ub