gpu

package
v2.14.1 Latest
Warning

This package is not in the latest version of its module.

Go to latest
Published: Dec 8, 2023 License: BSD-3-Clause Imports: 9 Imported by: 0

Documentation

Index

Constants

This section is empty.

Variables

View Source
// Lookup tables for the GemmBackendConfig_Epilogue enum. The two maps are
// inverses of each other and cover the eight values numbered 0 through 7.
var (
	// GemmBackendConfig_Epilogue_name maps an enum number to its name string.
	GemmBackendConfig_Epilogue_name = map[int32]string{
		0: "DEFAULT",
		1: "BIAS",
		2: "RELU",
		3: "BIAS_RELU",
		4: "GELU",
		5: "GELU_AUX",
		6: "BIAS_GELU",
		7: "BIAS_GELU_AUX",
	}
	// GemmBackendConfig_Epilogue_value maps an enum name string to its number.
	GemmBackendConfig_Epilogue_value = map[string]int32{
		"DEFAULT":       0,
		"BIAS":          1,
		"RELU":          2,
		"BIAS_RELU":     3,
		"GELU":          4,
		"GELU_AUX":      5,
		"BIAS_GELU":     6,
		"BIAS_GELU_AUX": 7,
	}
)

Enum value maps for GemmBackendConfig_Epilogue.

View Source
var File_tensorflow_compiler_xla_service_gpu_backend_configs_proto protoreflect.FileDescriptor
View Source
var File_tensorflow_compiler_xla_service_gpu_executable_proto protoreflect.FileDescriptor
View Source
var File_tensorflow_compiler_xla_service_gpu_gpu_autotuning_proto protoreflect.FileDescriptor
View Source
var File_tensorflow_compiler_xla_service_gpu_hlo_op_profile_proto protoreflect.FileDescriptor

Functions

This section is empty.

Types

type AlgorithmDenylist

// AlgorithmDenylist is a protobuf message whose only exported field, Entries,
// is a repeated list of AlgorithmDenylistEntry messages (field number 1).
type AlgorithmDenylist struct {
	Entries []*AlgorithmDenylistEntry `protobuf:"bytes,1,rep,name=entries,proto3" json:"entries,omitempty"`
	// contains filtered or unexported fields
}

func (*AlgorithmDenylist) Descriptor deprecated

func (*AlgorithmDenylist) Descriptor() ([]byte, []int)

Deprecated: Use AlgorithmDenylist.ProtoReflect.Descriptor instead.

func (*AlgorithmDenylist) GetEntries

func (x *AlgorithmDenylist) GetEntries() []*AlgorithmDenylistEntry

func (*AlgorithmDenylist) ProtoMessage

func (*AlgorithmDenylist) ProtoMessage()

func (*AlgorithmDenylist) ProtoReflect

func (x *AlgorithmDenylist) ProtoReflect() protoreflect.Message

func (*AlgorithmDenylist) Reset

func (x *AlgorithmDenylist) Reset()

func (*AlgorithmDenylist) String

func (x *AlgorithmDenylist) String() string

type AlgorithmDenylistEntry

// AlgorithmDenylistEntry is one element of AlgorithmDenylist.Entries. It holds
// an HLO string, a compute capability, a cuDNN version, a BLAS version string,
// and a repeated list of DenylistedAlgorithm messages.
//
// Field numbers do not follow declaration order: BlasVersion is field 5 and
// Algos is field 4.
//
// NOTE(review): presumably Algos lists the algorithms denied for the given
// hlo/cc/version combination — confirm against the .proto definition.
type AlgorithmDenylistEntry struct {
	Hlo          string                 `protobuf:"bytes,1,opt,name=hlo,proto3" json:"hlo,omitempty"`
	Cc           *xla.ComputeCapability `protobuf:"bytes,2,opt,name=cc,proto3" json:"cc,omitempty"`
	CudnnVersion *xla.CudnnVersion      `protobuf:"bytes,3,opt,name=cudnn_version,json=cudnnVersion,proto3" json:"cudnn_version,omitempty"`
	BlasVersion  string                 `protobuf:"bytes,5,opt,name=blas_version,json=blasVersion,proto3" json:"blas_version,omitempty"`
	Algos        []*DenylistedAlgorithm `protobuf:"bytes,4,rep,name=algos,proto3" json:"algos,omitempty"`
	// contains filtered or unexported fields
}

func (*AlgorithmDenylistEntry) Descriptor deprecated

func (*AlgorithmDenylistEntry) Descriptor() ([]byte, []int)

Deprecated: Use AlgorithmDenylistEntry.ProtoReflect.Descriptor instead.

func (*AlgorithmDenylistEntry) GetAlgos

func (*AlgorithmDenylistEntry) GetBlasVersion

func (x *AlgorithmDenylistEntry) GetBlasVersion() string

func (*AlgorithmDenylistEntry) GetCc

func (*AlgorithmDenylistEntry) GetCudnnVersion

func (x *AlgorithmDenylistEntry) GetCudnnVersion() *xla.CudnnVersion

func (*AlgorithmDenylistEntry) GetHlo

func (x *AlgorithmDenylistEntry) GetHlo() string

func (*AlgorithmDenylistEntry) ProtoMessage

func (*AlgorithmDenylistEntry) ProtoMessage()

func (*AlgorithmDenylistEntry) ProtoReflect

func (x *AlgorithmDenylistEntry) ProtoReflect() protoreflect.Message

func (*AlgorithmDenylistEntry) Reset

func (x *AlgorithmDenylistEntry) Reset()

func (*AlgorithmDenylistEntry) String

func (x *AlgorithmDenylistEntry) String() string

type BitcastBackendConfig

// BitcastBackendConfig is the backend config for a bitcast operation generated
// from the MLIR MHLO dialect. It carries two layout messages: SourceLayout
// (field number 1) and ResultLayout (field number 2).
type BitcastBackendConfig struct {
	SourceLayout *data.LayoutProto `protobuf:"bytes,1,opt,name=source_layout,json=sourceLayout,proto3" json:"source_layout,omitempty"`
	ResultLayout *data.LayoutProto `protobuf:"bytes,2,opt,name=result_layout,json=resultLayout,proto3" json:"result_layout,omitempty"`
	// contains filtered or unexported fields
}

Backend config for bitcast operation generated from MLIR MHLO dialect.

func (*BitcastBackendConfig) Descriptor deprecated

func (*BitcastBackendConfig) Descriptor() ([]byte, []int)

Deprecated: Use BitcastBackendConfig.ProtoReflect.Descriptor instead.

func (*BitcastBackendConfig) GetResultLayout

func (x *BitcastBackendConfig) GetResultLayout() *data.LayoutProto

func (*BitcastBackendConfig) GetSourceLayout

func (x *BitcastBackendConfig) GetSourceLayout() *data.LayoutProto

func (*BitcastBackendConfig) ProtoMessage

func (*BitcastBackendConfig) ProtoMessage()

func (*BitcastBackendConfig) ProtoReflect

func (x *BitcastBackendConfig) ProtoReflect() protoreflect.Message

func (*BitcastBackendConfig) Reset

func (x *BitcastBackendConfig) Reset()

func (*BitcastBackendConfig) String

func (x *BitcastBackendConfig) String() string

type CollectiveBackendConfig added in v2.13.0

// CollectiveBackendConfig is the backend config for async collective
// operations. Its only exported field is the boolean IsSync (field number 1),
// whose zero value is false.
type CollectiveBackendConfig struct {
	IsSync bool `protobuf:"varint,1,opt,name=is_sync,json=isSync,proto3" json:"is_sync,omitempty"`
	// contains filtered or unexported fields
}

Backend config for async collective operations. Note that is_sync will be false by default, so even if a backend config is not explicitly attached to the HLOInstruction, getting the backend_config will yield a default-valued proto which will have is_sync = false.

func (*CollectiveBackendConfig) Descriptor deprecated added in v2.13.0

func (*CollectiveBackendConfig) Descriptor() ([]byte, []int)

Deprecated: Use CollectiveBackendConfig.ProtoReflect.Descriptor instead.

func (*CollectiveBackendConfig) GetIsSync added in v2.13.0

func (x *CollectiveBackendConfig) GetIsSync() bool

func (*CollectiveBackendConfig) ProtoMessage added in v2.13.0

func (*CollectiveBackendConfig) ProtoMessage()

func (*CollectiveBackendConfig) ProtoReflect added in v2.13.0

func (x *CollectiveBackendConfig) ProtoReflect() protoreflect.Message

func (*CollectiveBackendConfig) Reset added in v2.13.0

func (x *CollectiveBackendConfig) Reset()

func (*CollectiveBackendConfig) String added in v2.13.0

func (x *CollectiveBackendConfig) String() string

type ConvInstructionLog

// ConvInstructionLog is a protobuf message with four exported fields: an HLO
// instruction proto (field 1), a repeated list of operand shapes (field 2), a
// uint64 result address (field 3), and a packed repeated list of uint64
// operand addresses (field 4).
//
// NOTE(review): presumably OperandShapes and OperandAddresses are parallel
// lists, one element per operand of Instruction — confirm against the producer.
type ConvInstructionLog struct {
	Instruction      *service.HloInstructionProto `protobuf:"bytes,1,opt,name=instruction,proto3" json:"instruction,omitempty"`
	OperandShapes    []*data.ShapeProto           `protobuf:"bytes,2,rep,name=operand_shapes,json=operandShapes,proto3" json:"operand_shapes,omitempty"`
	ResultAddress    uint64                       `protobuf:"varint,3,opt,name=result_address,json=resultAddress,proto3" json:"result_address,omitempty"`
	OperandAddresses []uint64                     `protobuf:"varint,4,rep,packed,name=operand_addresses,json=operandAddresses,proto3" json:"operand_addresses,omitempty"`
	// contains filtered or unexported fields
}

func (*ConvInstructionLog) Descriptor deprecated

func (*ConvInstructionLog) Descriptor() ([]byte, []int)

Deprecated: Use ConvInstructionLog.ProtoReflect.Descriptor instead.

func (*ConvInstructionLog) GetInstruction

func (x *ConvInstructionLog) GetInstruction() *service.HloInstructionProto

func (*ConvInstructionLog) GetOperandAddresses

func (x *ConvInstructionLog) GetOperandAddresses() []uint64

func (*ConvInstructionLog) GetOperandShapes

func (x *ConvInstructionLog) GetOperandShapes() []*data.ShapeProto

func (*ConvInstructionLog) GetResultAddress

func (x *ConvInstructionLog) GetResultAddress() uint64

func (*ConvInstructionLog) ProtoMessage

func (*ConvInstructionLog) ProtoMessage()

func (*ConvInstructionLog) ProtoReflect

func (x *ConvInstructionLog) ProtoReflect() protoreflect.Message

func (*ConvInstructionLog) Reset

func (x *ConvInstructionLog) Reset()

func (*ConvInstructionLog) String

func (x *ConvInstructionLog) String() string

type CudnnConvBackendConfig

// CudnnConvBackendConfig is the backend config for a convolution that runs
// through cudnn.
//
// Besides the plain scalar and message fields it has one oneof wrapper field,
// FilterAndBiasReorderingOneof, and SerializedGraph, a *string whose protobuf
// tag also carries the "oneof" marker. The struct tag of ActivationMode is
// elided in this rendering.
type CudnnConvBackendConfig struct {

	// Opaque algorithm number and tuning knobs chosen for this conv.
	Algorithm *protobuf.AlgorithmProto `protobuf:"bytes,6,opt,name=algorithm,proto3" json:"algorithm,omitempty"`
	// The scaling factor multiplied with the convolution result.
	ConvResultScale float64 `protobuf:"fixed64,4,opt,name=conv_result_scale,json=convResultScale,proto3" json:"conv_result_scale,omitempty"`
	// The requested activation (e.g. relu) after the convolution.
	ActivationMode protobuf.ActivationMode `` /* 144-byte string literal not displayed */
	// The scaling factor multiplied with the side input. If no side input buffer
	// is provided, this field must be 0.
	SideInputScale float64 `protobuf:"fixed64,5,opt,name=side_input_scale,json=sideInputScale,proto3" json:"side_input_scale,omitempty"`
	// The negative slope coefficient alpha for leaky_relu activation, used only
	// when activation_mode is kLeakyRelu.
	//
	// leakyrelu(x) is defined as x > 0 ? x : alpha * x.
	//
	// Since this is a proto3 proto, leakyrelu_alpha is 0 if not specified (in
	// which case the leakyrelu activation is equivalent to relu).
	LeakyreluAlpha float64 `protobuf:"fixed64,8,opt,name=leakyrelu_alpha,json=leakyreluAlpha,proto3" json:"leakyrelu_alpha,omitempty"`
	// If the filter (and bias, if present) have been reordered, set this flag.
	// It's placed into a `oneof` block to skip the serialization when not set.
	//
	// Types that are assignable to FilterAndBiasReorderingOneof:
	//
	//	*CudnnConvBackendConfig_ReorderedInt8NchwVect
	FilterAndBiasReorderingOneof isCudnnConvBackendConfig_FilterAndBiasReorderingOneof `protobuf_oneof:"filter_and_bias_reordering_oneof"`
	// Serialization of the graph described by the convolution and adjacent
	// pointwise ops.
	SerializedGraph *string `protobuf:"bytes,9,opt,name=serialized_graph,json=serializedGraph,proto3,oneof" json:"serialized_graph,omitempty"`
	// contains filtered or unexported fields
}

Backend config for a convolution that runs through cudnn.

func (*CudnnConvBackendConfig) Descriptor deprecated

func (*CudnnConvBackendConfig) Descriptor() ([]byte, []int)

Deprecated: Use CudnnConvBackendConfig.ProtoReflect.Descriptor instead.

func (*CudnnConvBackendConfig) GetActivationMode

func (x *CudnnConvBackendConfig) GetActivationMode() protobuf.ActivationMode

func (*CudnnConvBackendConfig) GetAlgorithm

func (x *CudnnConvBackendConfig) GetAlgorithm() *protobuf.AlgorithmProto

func (*CudnnConvBackendConfig) GetConvResultScale

func (x *CudnnConvBackendConfig) GetConvResultScale() float64

func (*CudnnConvBackendConfig) GetFilterAndBiasReorderingOneof added in v2.13.0

func (m *CudnnConvBackendConfig) GetFilterAndBiasReorderingOneof() isCudnnConvBackendConfig_FilterAndBiasReorderingOneof

func (*CudnnConvBackendConfig) GetLeakyreluAlpha added in v2.14.0

func (x *CudnnConvBackendConfig) GetLeakyreluAlpha() float64

func (*CudnnConvBackendConfig) GetReorderedInt8NchwVect added in v2.13.0

func (x *CudnnConvBackendConfig) GetReorderedInt8NchwVect() bool

func (*CudnnConvBackendConfig) GetSerializedGraph added in v2.14.0

func (x *CudnnConvBackendConfig) GetSerializedGraph() string

func (*CudnnConvBackendConfig) GetSideInputScale

func (x *CudnnConvBackendConfig) GetSideInputScale() float64

func (*CudnnConvBackendConfig) ProtoMessage

func (*CudnnConvBackendConfig) ProtoMessage()

func (*CudnnConvBackendConfig) ProtoReflect

func (x *CudnnConvBackendConfig) ProtoReflect() protoreflect.Message

func (*CudnnConvBackendConfig) Reset

func (x *CudnnConvBackendConfig) Reset()

func (*CudnnConvBackendConfig) String

func (x *CudnnConvBackendConfig) String() string

type CudnnConvBackendConfig_ReorderedInt8NchwVect added in v2.13.0

// CudnnConvBackendConfig_ReorderedInt8NchwVect is the wrapper type listed as
// assignable to CudnnConvBackendConfig.FilterAndBiasReorderingOneof. It wraps
// a single bool, protobuf field number 7.
type CudnnConvBackendConfig_ReorderedInt8NchwVect struct {
	// cuDNN int8x32 vectorized convolutions (NCHW_VECT_C data layout) can be
	// optimized by reordering the filter and bias (if present). The logical
	// layout stays the same, but the data is shuffled in a way that is
	// compatible with NVidia's IMMA instruction (sm75+).
	ReorderedInt8NchwVect bool `protobuf:"varint,7,opt,name=reordered_int8_nchw_vect,json=reorderedInt8NchwVect,proto3,oneof"`
}

type CudnnfMHABackendConfig added in v2.14.0

// CudnnfMHABackendConfig is the backend config for a fused Multi-Headed
// Attention (fMHA) that runs through cudnn.
//
// The fields fall into three groups: algorithm, scale, dropout rate and seed;
// the dot-dimension numbers and intermediate tensor shape for the forward
// graph; and four dot-dimension-number messages for the backward graph. The
// struct tags of the forward- and backward-graph fields are elided in this
// rendering, so their field numbers are not visible here.
type CudnnfMHABackendConfig struct {

	// Opaque algorithm number and tuning knobs chosen for this fMHA.
	Algorithm *protobuf.AlgorithmProto `protobuf:"bytes,8,opt,name=algorithm,proto3" json:"algorithm,omitempty"`
	// The scaling factor multiplied with the BMM1 result. fmha_scale is 1 if the
	// MHA pattern has no scaling.
	FmhaScale float64 `protobuf:"fixed64,10,opt,name=fmha_scale,json=fmhaScale,proto3" json:"fmha_scale,omitempty"`
	// Dropout factor in MHA
	DropoutRate float64 `protobuf:"fixed64,13,opt,name=dropout_rate,json=dropoutRate,proto3" json:"dropout_rate,omitempty"`
	// Configs for mha bmms in the forward graph
	Bmm1DotDimensionNumbers *data.DotDimensionNumbers `` /* 135-byte string literal not displayed */
	Bmm2DotDimensionNumbers *data.DotDimensionNumbers `` /* 135-byte string literal not displayed */
	IntermediateTensorShape *data.ShapeProto          `` /* 133-byte string literal not displayed */
	// Configs for mha bmms in the backward graph
	Bmm1GradGemm1DotDimensionNumbers *data.DotDimensionNumbers `` /* 166-byte string literal not displayed */
	Bmm1GradGemm2DotDimensionNumbers *data.DotDimensionNumbers `` /* 166-byte string literal not displayed */
	Bmm2GradGemm1DotDimensionNumbers *data.DotDimensionNumbers `` /* 166-byte string literal not displayed */
	Bmm2GradGemm2DotDimensionNumbers *data.DotDimensionNumbers `` /* 166-byte string literal not displayed */
	// Random seed used by dropout
	Seed int64 `protobuf:"varint,15,opt,name=seed,proto3" json:"seed,omitempty"`
	// contains filtered or unexported fields
}

Backend config for a fused Multi-Headed Attention (fMHA) that runs through cudnn.

func (*CudnnfMHABackendConfig) Descriptor deprecated added in v2.14.0

func (*CudnnfMHABackendConfig) Descriptor() ([]byte, []int)

Deprecated: Use CudnnfMHABackendConfig.ProtoReflect.Descriptor instead.

func (*CudnnfMHABackendConfig) GetAlgorithm added in v2.14.0

func (x *CudnnfMHABackendConfig) GetAlgorithm() *protobuf.AlgorithmProto

func (*CudnnfMHABackendConfig) GetBmm1DotDimensionNumbers added in v2.14.0

func (x *CudnnfMHABackendConfig) GetBmm1DotDimensionNumbers() *data.DotDimensionNumbers

func (*CudnnfMHABackendConfig) GetBmm1GradGemm1DotDimensionNumbers added in v2.14.0

func (x *CudnnfMHABackendConfig) GetBmm1GradGemm1DotDimensionNumbers() *data.DotDimensionNumbers

func (*CudnnfMHABackendConfig) GetBmm1GradGemm2DotDimensionNumbers added in v2.14.0

func (x *CudnnfMHABackendConfig) GetBmm1GradGemm2DotDimensionNumbers() *data.DotDimensionNumbers

func (*CudnnfMHABackendConfig) GetBmm2DotDimensionNumbers added in v2.14.0

func (x *CudnnfMHABackendConfig) GetBmm2DotDimensionNumbers() *data.DotDimensionNumbers

func (*CudnnfMHABackendConfig) GetBmm2GradGemm1DotDimensionNumbers added in v2.14.0

func (x *CudnnfMHABackendConfig) GetBmm2GradGemm1DotDimensionNumbers() *data.DotDimensionNumbers

func (*CudnnfMHABackendConfig) GetBmm2GradGemm2DotDimensionNumbers added in v2.14.0

func (x *CudnnfMHABackendConfig) GetBmm2GradGemm2DotDimensionNumbers() *data.DotDimensionNumbers

func (*CudnnfMHABackendConfig) GetDropoutRate added in v2.14.0

func (x *CudnnfMHABackendConfig) GetDropoutRate() float64

func (*CudnnfMHABackendConfig) GetFmhaScale added in v2.14.0

func (x *CudnnfMHABackendConfig) GetFmhaScale() float64

func (*CudnnfMHABackendConfig) GetIntermediateTensorShape added in v2.14.0

func (x *CudnnfMHABackendConfig) GetIntermediateTensorShape() *data.ShapeProto

func (*CudnnfMHABackendConfig) GetSeed added in v2.14.0

func (x *CudnnfMHABackendConfig) GetSeed() int64

func (*CudnnfMHABackendConfig) ProtoMessage added in v2.14.0

func (*CudnnfMHABackendConfig) ProtoMessage()

func (*CudnnfMHABackendConfig) ProtoReflect added in v2.14.0

func (x *CudnnfMHABackendConfig) ProtoReflect() protoreflect.Message

func (*CudnnfMHABackendConfig) Reset added in v2.14.0

func (x *CudnnfMHABackendConfig) Reset()

func (*CudnnfMHABackendConfig) String added in v2.14.0

func (x *CudnnfMHABackendConfig) String() string

type DenylistedAlgorithm

// DenylistedAlgorithm is the element type of AlgorithmDenylistEntry.Algos. It
// pairs an int64 Id (field number 1) with a bool TensorOps (field number 2).
//
// NOTE(review): presumably Id is an algorithm identifier and TensorOps says
// whether the tensor-op variant is meant — confirm against the .proto.
type DenylistedAlgorithm struct {
	Id        int64 `protobuf:"varint,1,opt,name=id,proto3" json:"id,omitempty"`
	TensorOps bool  `protobuf:"varint,2,opt,name=tensor_ops,json=tensorOps,proto3" json:"tensor_ops,omitempty"`
	// contains filtered or unexported fields
}

func (*DenylistedAlgorithm) Descriptor deprecated

func (*DenylistedAlgorithm) Descriptor() ([]byte, []int)

Deprecated: Use DenylistedAlgorithm.ProtoReflect.Descriptor instead.

func (*DenylistedAlgorithm) GetId

func (x *DenylistedAlgorithm) GetId() int64

func (*DenylistedAlgorithm) GetTensorOps

func (x *DenylistedAlgorithm) GetTensorOps() bool

func (*DenylistedAlgorithm) ProtoMessage

func (*DenylistedAlgorithm) ProtoMessage()

func (*DenylistedAlgorithm) ProtoReflect

func (x *DenylistedAlgorithm) ProtoReflect() protoreflect.Message

func (*DenylistedAlgorithm) Reset

func (x *DenylistedAlgorithm) Reset()

func (*DenylistedAlgorithm) String

func (x *DenylistedAlgorithm) String() string

type DeviceHloInstructionProfiles added in v2.14.0

// DeviceHloInstructionProfiles holds a single map from string keys to
// HloInstructionProfileList messages. The struct tag of Entries is elided in
// this rendering.
//
// NOTE(review): the type name suggests the map key identifies a device —
// confirm against the .proto definition.
type DeviceHloInstructionProfiles struct {
	Entries map[string]*HloInstructionProfileList `` /* 155-byte string literal not displayed */
	// contains filtered or unexported fields
}

func (*DeviceHloInstructionProfiles) Descriptor deprecated added in v2.14.0

func (*DeviceHloInstructionProfiles) Descriptor() ([]byte, []int)

Deprecated: Use DeviceHloInstructionProfiles.ProtoReflect.Descriptor instead.

func (*DeviceHloInstructionProfiles) GetEntries added in v2.14.0

func (*DeviceHloInstructionProfiles) ProtoMessage added in v2.14.0

func (*DeviceHloInstructionProfiles) ProtoMessage()

func (*DeviceHloInstructionProfiles) ProtoReflect added in v2.14.0

func (*DeviceHloInstructionProfiles) Reset added in v2.14.0

func (x *DeviceHloInstructionProfiles) Reset()

func (*DeviceHloInstructionProfiles) String added in v2.14.0

type FusionBackendConfig added in v2.14.0

// FusionBackendConfig is a protobuf message with three exported fields: the
// fusion kind string (field 1), a Triton GEMM configuration (field 2), and a
// cost-model prediction as a ReificationCost message (field 3).
type FusionBackendConfig struct {

	// kLoop, kInput, or kOutput (from HloInstruction::FusionKind), or your own
	// custom string.
	//
	// Don't put "kCustom" in here -- just put a string describing the custom
	// fusion, like "__triton_gemm".
	//
	// This is somewhat redundant with HloInstruction::fusion_kind().  We need it
	// here because LMHLO does not have the concept of a fusion kind, and we use
	// this same backend-config proto for both HLO and LMHLO.
	Kind string `protobuf:"bytes,1,opt,name=kind,proto3" json:"kind,omitempty"`
	// Only valid when kind == "__triton_gemm".  Even then it's optional: If not
	// present, we use the default Triton config.
	TritonGemmConfig *xla.AutotuneResult_TritonGemmKey `protobuf:"bytes,2,opt,name=triton_gemm_config,json=tritonGemmConfig,proto3" json:"triton_gemm_config,omitempty"`
	// Cost model prediction.
	ReificationCost *ReificationCost `protobuf:"bytes,3,opt,name=reification_cost,json=reificationCost,proto3" json:"reification_cost,omitempty"`
	// contains filtered or unexported fields
}

func (*FusionBackendConfig) Descriptor deprecated added in v2.14.0

func (*FusionBackendConfig) Descriptor() ([]byte, []int)

Deprecated: Use FusionBackendConfig.ProtoReflect.Descriptor instead.

func (*FusionBackendConfig) GetKind added in v2.14.0

func (x *FusionBackendConfig) GetKind() string

func (*FusionBackendConfig) GetReificationCost added in v2.14.0

func (x *FusionBackendConfig) GetReificationCost() *ReificationCost

func (*FusionBackendConfig) GetTritonGemmConfig added in v2.14.0

func (x *FusionBackendConfig) GetTritonGemmConfig() *xla.AutotuneResult_TritonGemmKey

func (*FusionBackendConfig) ProtoMessage added in v2.14.0

func (*FusionBackendConfig) ProtoMessage()

func (*FusionBackendConfig) ProtoReflect added in v2.14.0

func (x *FusionBackendConfig) ProtoReflect() protoreflect.Message

func (*FusionBackendConfig) Reset added in v2.14.0

func (x *FusionBackendConfig) Reset()

func (*FusionBackendConfig) String added in v2.14.0

func (x *FusionBackendConfig) String() string

type GemmBackendConfig

// GemmBackendConfig is the backend config for the GEMM operation running
// through cuBLAS.
//
// Algorithm is a oneof wrapper field. The remaining fields are three float64
// scalars (AlphaReal, AlphaImag, Beta), the dot dimension numbers, the
// precision config, and the Epilogue enum.
//
// NOTE(review): presumably AlphaReal/AlphaImag are the real and imaginary
// parts of the GEMM alpha scalar and Beta is the GEMM beta scalar — confirm
// against the .proto definition.
type GemmBackendConfig struct {

	// Opaque optional algorithm number. No chosen number indicates that a
	// different cuBLAS API will be used, which does not allow for choosing an
	// algorithm.
	//
	// Types that are assignable to Algorithm:
	//
	//	*GemmBackendConfig_SelectedAlgorithm
	Algorithm           isGemmBackendConfig_Algorithm `protobuf_oneof:"algorithm"`
	AlphaReal           float64                       `protobuf:"fixed64,2,opt,name=alpha_real,json=alphaReal,proto3" json:"alpha_real,omitempty"`
	AlphaImag           float64                       `protobuf:"fixed64,9,opt,name=alpha_imag,json=alphaImag,proto3" json:"alpha_imag,omitempty"`
	Beta                float64                       `protobuf:"fixed64,3,opt,name=beta,proto3" json:"beta,omitempty"`
	DotDimensionNumbers *data.DotDimensionNumbers     `protobuf:"bytes,7,opt,name=dot_dimension_numbers,json=dotDimensionNumbers,proto3" json:"dot_dimension_numbers,omitempty"`
	PrecisionConfig     *data.PrecisionConfig         `protobuf:"bytes,12,opt,name=precision_config,json=precisionConfig,proto3" json:"precision_config,omitempty"`
	Epilogue            GemmBackendConfig_Epilogue    `protobuf:"varint,13,opt,name=epilogue,proto3,enum=xla.gpu.GemmBackendConfig_Epilogue" json:"epilogue,omitempty"`
	// contains filtered or unexported fields
}

Backend config for the GEMM operation running through cuBLAS.

func (*GemmBackendConfig) Descriptor deprecated

func (*GemmBackendConfig) Descriptor() ([]byte, []int)

Deprecated: Use GemmBackendConfig.ProtoReflect.Descriptor instead.

func (*GemmBackendConfig) GetAlgorithm

func (m *GemmBackendConfig) GetAlgorithm() isGemmBackendConfig_Algorithm

func (*GemmBackendConfig) GetAlphaImag

func (x *GemmBackendConfig) GetAlphaImag() float64

func (*GemmBackendConfig) GetAlphaReal

func (x *GemmBackendConfig) GetAlphaReal() float64

func (*GemmBackendConfig) GetBeta

func (x *GemmBackendConfig) GetBeta() float64

func (*GemmBackendConfig) GetDotDimensionNumbers

func (x *GemmBackendConfig) GetDotDimensionNumbers() *data.DotDimensionNumbers

func (*GemmBackendConfig) GetEpilogue

func (*GemmBackendConfig) GetPrecisionConfig

func (x *GemmBackendConfig) GetPrecisionConfig() *data.PrecisionConfig

func (*GemmBackendConfig) GetSelectedAlgorithm

func (x *GemmBackendConfig) GetSelectedAlgorithm() int64

func (*GemmBackendConfig) ProtoMessage

func (*GemmBackendConfig) ProtoMessage()

func (*GemmBackendConfig) ProtoReflect

func (x *GemmBackendConfig) ProtoReflect() protoreflect.Message

func (*GemmBackendConfig) Reset

func (x *GemmBackendConfig) Reset()

func (*GemmBackendConfig) String

func (x *GemmBackendConfig) String() string

type GemmBackendConfig_Epilogue

// GemmBackendConfig_Epilogue is the int32-backed enum type of the
// GemmBackendConfig.Epilogue field (the cublasLt matmul epilogue).
type GemmBackendConfig_Epilogue int32

cublasLt matmul epilogue.

// Values of the GemmBackendConfig_Epilogue enum. The numbers 0 through 7 match
// the entries of GemmBackendConfig_Epilogue_name and
// GemmBackendConfig_Epilogue_value.
const (
	GemmBackendConfig_DEFAULT       GemmBackendConfig_Epilogue = 0
	GemmBackendConfig_BIAS          GemmBackendConfig_Epilogue = 1
	GemmBackendConfig_RELU          GemmBackendConfig_Epilogue = 2
	GemmBackendConfig_BIAS_RELU     GemmBackendConfig_Epilogue = 3
	GemmBackendConfig_GELU          GemmBackendConfig_Epilogue = 4
	GemmBackendConfig_GELU_AUX      GemmBackendConfig_Epilogue = 5
	GemmBackendConfig_BIAS_GELU     GemmBackendConfig_Epilogue = 6
	GemmBackendConfig_BIAS_GELU_AUX GemmBackendConfig_Epilogue = 7
)

func (GemmBackendConfig_Epilogue) Descriptor

func (GemmBackendConfig_Epilogue) Enum

func (GemmBackendConfig_Epilogue) EnumDescriptor deprecated

func (GemmBackendConfig_Epilogue) EnumDescriptor() ([]byte, []int)

Deprecated: Use GemmBackendConfig_Epilogue.Descriptor instead.

func (GemmBackendConfig_Epilogue) Number

func (GemmBackendConfig_Epilogue) String

func (GemmBackendConfig_Epilogue) Type

type GemmBackendConfig_SelectedAlgorithm

// GemmBackendConfig_SelectedAlgorithm is the wrapper type listed as assignable
// to GemmBackendConfig.Algorithm. It wraps a single int64, protobuf field
// number 1.
type GemmBackendConfig_SelectedAlgorithm struct {
	SelectedAlgorithm int64 `protobuf:"varint,1,opt,name=selected_algorithm,json=selectedAlgorithm,proto3,oneof"`
}

type HloInstructionProfile added in v2.14.0

// HloInstructionProfile pairs an HLO instruction proto (field number 1) with
// an int64 ClockCycles value (field number 2).
//
// NOTE(review): presumably ClockCycles is the measured cost of executing
// Instruction — confirm against the producer of these profiles.
type HloInstructionProfile struct {
	Instruction *service.HloInstructionProto `protobuf:"bytes,1,opt,name=instruction,proto3" json:"instruction,omitempty"`
	ClockCycles int64                        `protobuf:"varint,2,opt,name=clock_cycles,json=clockCycles,proto3" json:"clock_cycles,omitempty"`
	// contains filtered or unexported fields
}

func (*HloInstructionProfile) Descriptor deprecated added in v2.14.0

func (*HloInstructionProfile) Descriptor() ([]byte, []int)

Deprecated: Use HloInstructionProfile.ProtoReflect.Descriptor instead.

func (*HloInstructionProfile) GetClockCycles added in v2.14.0

func (x *HloInstructionProfile) GetClockCycles() int64

func (*HloInstructionProfile) GetInstruction added in v2.14.0

func (x *HloInstructionProfile) GetInstruction() *service.HloInstructionProto

func (*HloInstructionProfile) ProtoMessage added in v2.14.0

func (*HloInstructionProfile) ProtoMessage()

func (*HloInstructionProfile) ProtoReflect added in v2.14.0

func (x *HloInstructionProfile) ProtoReflect() protoreflect.Message

func (*HloInstructionProfile) Reset added in v2.14.0

func (x *HloInstructionProfile) Reset()

func (*HloInstructionProfile) String added in v2.14.0

func (x *HloInstructionProfile) String() string

type HloInstructionProfileList added in v2.14.0

// HloInstructionProfileList wraps a repeated list of HloInstructionProfile
// messages (field number 1). It is the value type of
// DeviceHloInstructionProfiles.Entries.
type HloInstructionProfileList struct {
	Entries []*HloInstructionProfile `protobuf:"bytes,1,rep,name=entries,proto3" json:"entries,omitempty"`
	// contains filtered or unexported fields
}

func (*HloInstructionProfileList) Descriptor deprecated added in v2.14.0

func (*HloInstructionProfileList) Descriptor() ([]byte, []int)

Deprecated: Use HloInstructionProfileList.ProtoReflect.Descriptor instead.

func (*HloInstructionProfileList) GetEntries added in v2.14.0

func (*HloInstructionProfileList) ProtoMessage added in v2.14.0

func (*HloInstructionProfileList) ProtoMessage()

func (*HloInstructionProfileList) ProtoReflect added in v2.14.0

func (*HloInstructionProfileList) Reset added in v2.14.0

func (x *HloInstructionProfileList) Reset()

func (*HloInstructionProfileList) String added in v2.14.0

func (x *HloInstructionProfileList) String() string

type ReificationCost added in v2.14.0

// ReificationCost holds a single float64, EndToEndCycles (field number 1). It
// is the type of FusionBackendConfig.ReificationCost, documented there as a
// cost model prediction.
type ReificationCost struct {
	EndToEndCycles float64 `protobuf:"fixed64,1,opt,name=end_to_end_cycles,json=endToEndCycles,proto3" json:"end_to_end_cycles,omitempty"` // Total execution time of the reified op.
	// contains filtered or unexported fields
}

func (*ReificationCost) Descriptor deprecated added in v2.14.0

func (*ReificationCost) Descriptor() ([]byte, []int)

Deprecated: Use ReificationCost.ProtoReflect.Descriptor instead.

func (*ReificationCost) GetEndToEndCycles added in v2.14.0

func (x *ReificationCost) GetEndToEndCycles() float64

func (*ReificationCost) ProtoMessage added in v2.14.0

func (*ReificationCost) ProtoMessage()

func (*ReificationCost) ProtoReflect added in v2.14.0

func (x *ReificationCost) ProtoReflect() protoreflect.Message

func (*ReificationCost) Reset added in v2.14.0

func (x *ReificationCost) Reset()

func (*ReificationCost) String added in v2.14.0

func (x *ReificationCost) String() string

type XlaRuntimeGpuExecutableProto added in v2.11.0

// XlaRuntimeGpuExecutableProto is a protobuf message that bundles an
// XlaRuntimeExecutableProto (field 1) with GPU-specific data: entry-function
// attributes (field 2), PTX text (field 3), the matching CUBIN bytes (field 4),
// and a repeated list of constants (field 5).
type XlaRuntimeGpuExecutableProto struct {
	XlaRuntimeExecutable *service.XlaRuntimeExecutableProto `protobuf:"bytes,1,opt,name=xla_runtime_executable,json=xlaRuntimeExecutable,proto3" json:"xla_runtime_executable,omitempty"`
	// XLA-specific attributes of the executable's entry function.
	EntryFuncAttrs *service.EntryFunctionAttributes `protobuf:"bytes,2,opt,name=entry_func_attrs,json=entryFuncAttrs,proto3" json:"entry_func_attrs,omitempty"`
	// PTX for the compiled GPU kernels.
	GpuAsmText string `protobuf:"bytes,3,opt,name=gpu_asm_text,json=gpuAsmText,proto3" json:"gpu_asm_text,omitempty"`
	// Corresponding CUBIN for the above PTX.
	GpuBinary []byte `protobuf:"bytes,4,opt,name=gpu_binary,json=gpuBinary,proto3" json:"gpu_binary,omitempty"`
	// Constants required by the serialized executable.
	Constants []*XlaRuntimeGpuExecutableProto_ConstantInfoProto `protobuf:"bytes,5,rep,name=constants,proto3" json:"constants,omitempty"`
	// contains filtered or unexported fields
}

func (*XlaRuntimeGpuExecutableProto) Descriptor deprecated added in v2.11.0

func (*XlaRuntimeGpuExecutableProto) Descriptor() ([]byte, []int)

Deprecated: Use XlaRuntimeGpuExecutableProto.ProtoReflect.Descriptor instead.

func (*XlaRuntimeGpuExecutableProto) GetConstants added in v2.12.0

func (*XlaRuntimeGpuExecutableProto) GetEntryFuncAttrs added in v2.12.0

func (*XlaRuntimeGpuExecutableProto) GetGpuAsmText added in v2.11.0

func (x *XlaRuntimeGpuExecutableProto) GetGpuAsmText() string

func (*XlaRuntimeGpuExecutableProto) GetGpuBinary added in v2.11.0

func (x *XlaRuntimeGpuExecutableProto) GetGpuBinary() []byte

func (*XlaRuntimeGpuExecutableProto) GetXlaRuntimeExecutable added in v2.11.0

func (x *XlaRuntimeGpuExecutableProto) GetXlaRuntimeExecutable() *service.XlaRuntimeExecutableProto

func (*XlaRuntimeGpuExecutableProto) ProtoMessage added in v2.11.0

func (*XlaRuntimeGpuExecutableProto) ProtoMessage()

func (*XlaRuntimeGpuExecutableProto) ProtoReflect added in v2.11.0

func (*XlaRuntimeGpuExecutableProto) Reset added in v2.11.0

func (x *XlaRuntimeGpuExecutableProto) Reset()

func (*XlaRuntimeGpuExecutableProto) String added in v2.11.0

type XlaRuntimeGpuExecutableProto_ConstantInfoProto added in v2.12.0

// XlaRuntimeGpuExecutableProto_ConstantInfoProto is the element type of
// XlaRuntimeGpuExecutableProto.Constants. It holds a symbol name string
// (field 1), the content bytes (field 2), and an int32 allocation index
// (field 3).
//
// NOTE(review): presumably AllocationIndex refers to a buffer allocation of
// the executable — confirm against the code that consumes this message.
type XlaRuntimeGpuExecutableProto_ConstantInfoProto struct {
	SymbolName      string `protobuf:"bytes,1,opt,name=symbol_name,json=symbolName,proto3" json:"symbol_name,omitempty"`
	Content         []byte `protobuf:"bytes,2,opt,name=content,proto3" json:"content,omitempty"`
	AllocationIndex int32  `protobuf:"varint,3,opt,name=allocation_index,json=allocationIndex,proto3" json:"allocation_index,omitempty"`
	// contains filtered or unexported fields
}

func (*XlaRuntimeGpuExecutableProto_ConstantInfoProto) Descriptor deprecated added in v2.12.0

Deprecated: Use XlaRuntimeGpuExecutableProto_ConstantInfoProto.ProtoReflect.Descriptor instead.

func (*XlaRuntimeGpuExecutableProto_ConstantInfoProto) GetAllocationIndex added in v2.12.0

func (x *XlaRuntimeGpuExecutableProto_ConstantInfoProto) GetAllocationIndex() int32

func (*XlaRuntimeGpuExecutableProto_ConstantInfoProto) GetContent added in v2.12.0

func (*XlaRuntimeGpuExecutableProto_ConstantInfoProto) GetSymbolName added in v2.12.0

func (*XlaRuntimeGpuExecutableProto_ConstantInfoProto) ProtoMessage added in v2.12.0

func (*XlaRuntimeGpuExecutableProto_ConstantInfoProto) ProtoReflect added in v2.12.0

func (*XlaRuntimeGpuExecutableProto_ConstantInfoProto) Reset added in v2.12.0

func (*XlaRuntimeGpuExecutableProto_ConstantInfoProto) String added in v2.12.0

Jump to

Keyboard shortcuts

? : This menu
/ : Search site
f or F : Jump to
y or Y : Canonical URL