stream_executor

package
v2.14.1 Latest
Warning

This package is not in the latest version of its module.

Go to latest
Published: Dec 8, 2023 | License: BSD-3-Clause | Imports: 6 | Imported by: 0

Documentation

Index

Constants

View Source
const ActivationMode_kBandPass = protobuf.ActivationMode_kBandPass
View Source
const ActivationMode_kElu = protobuf.ActivationMode_kElu
View Source
const ActivationMode_kGeluExact = protobuf.ActivationMode_kGeluExact
View Source
const ActivationMode_kLeakyRelu = protobuf.ActivationMode_kLeakyRelu
View Source
const ActivationMode_kNone = protobuf.ActivationMode_kNone
View Source
const ActivationMode_kRelu = protobuf.ActivationMode_kRelu
View Source
const ActivationMode_kRelu6 = protobuf.ActivationMode_kRelu6
View Source
const ActivationMode_kReluX = protobuf.ActivationMode_kReluX
View Source
const ActivationMode_kSigmoid = protobuf.ActivationMode_kSigmoid
View Source
const ActivationMode_kTanh = protobuf.ActivationMode_kTanh
View Source
const AlgorithmProto_DEFAULT_MATH = protobuf.AlgorithmProto_DEFAULT_MATH
View Source
const AlgorithmProto_TENSOR_OP_MATH = protobuf.AlgorithmProto_TENSOR_OP_MATH
View Source
const ConvolutionKind_BACKWARD_DATA = protobuf.ConvolutionKind_BACKWARD_DATA
View Source
const ConvolutionKind_BACKWARD_FILTER = protobuf.ConvolutionKind_BACKWARD_FILTER
View Source
const ConvolutionKind_FORWARD = protobuf.ConvolutionKind_FORWARD
View Source
const ConvolutionKind_FORWARD_BIAS_ACTIVATION = protobuf.ConvolutionKind_FORWARD_BIAS_ACTIVATION
View Source
const ConvolutionKind_FORWARD_GRAPH = protobuf.ConvolutionKind_FORWARD_GRAPH
View Source
const ConvolutionKind_INVALID = protobuf.ConvolutionKind_INVALID
View Source
const ConvolutionMode_CONVOLUTION = protobuf.ConvolutionMode_CONVOLUTION
View Source
const ConvolutionMode_CROSS_CORRELATION = protobuf.ConvolutionMode_CROSS_CORRELATION
View Source
const DataLayout_kBatchDepthYX = protobuf.DataLayout_kBatchDepthYX
View Source
const DataLayout_kBatchDepthYX32 = protobuf.DataLayout_kBatchDepthYX32
View Source
const DataLayout_kBatchDepthYX4 = protobuf.DataLayout_kBatchDepthYX4
View Source
const DataLayout_kBatchYXDepth = protobuf.DataLayout_kBatchYXDepth
View Source
const DataLayout_kYXBatchDepth = protobuf.DataLayout_kYXBatchDepth
View Source
const DataLayout_kYXDepthBatch = protobuf.DataLayout_kYXDepthBatch
View Source
const DataType_kBF16 = protobuf.DataType_kBF16
View Source
const DataType_kComplexDouble = protobuf.DataType_kComplexDouble
View Source
const DataType_kComplexFloat = protobuf.DataType_kComplexFloat
View Source
const DataType_kDouble = protobuf.DataType_kDouble
View Source
const DataType_kF8E4M3FN = protobuf.DataType_kF8E4M3FN
View Source
const DataType_kF8E4M3FNUZ = protobuf.DataType_kF8E4M3FNUZ
View Source
const DataType_kF8E5M2 = protobuf.DataType_kF8E5M2
View Source
const DataType_kF8E5M2FNUZ = protobuf.DataType_kF8E5M2FNUZ
View Source
const DataType_kFloat = protobuf.DataType_kFloat
View Source
const DataType_kHalf = protobuf.DataType_kHalf
View Source
const DataType_kInt32 = protobuf.DataType_kInt32
View Source
const DataType_kInt64 = protobuf.DataType_kInt64
View Source
const DataType_kInt8 = protobuf.DataType_kInt8
View Source
const FilterLayout_kInputYXOutput = protobuf.FilterLayout_kInputYXOutput
View Source
const FilterLayout_kOutputInputYX = protobuf.FilterLayout_kOutputInputYX
View Source
const FilterLayout_kOutputInputYX32 = protobuf.FilterLayout_kOutputInputYX32
View Source
const FilterLayout_kOutputInputYX32_CudnnReordered = protobuf.FilterLayout_kOutputInputYX32_CudnnReordered
View Source
const FilterLayout_kOutputInputYX4 = protobuf.FilterLayout_kOutputInputYX4
View Source
const FilterLayout_kOutputYXInput = protobuf.FilterLayout_kOutputYXInput
View Source
const FilterLayout_kYXInputOutput = protobuf.FilterLayout_kYXInputOutput
View Source
const FusedMHAKind_BMM1_OUTPUT_FLOAT = protobuf.FusedMHAKind_BMM1_OUTPUT_FLOAT
View Source
const FusedMHAKind_BMM1_OUTPUT_INPUT_TYPE = protobuf.FusedMHAKind_BMM1_OUTPUT_INPUT_TYPE
View Source
const FusedMHAKind_BMM1_OUTPUT_UNKNOWN = protobuf.FusedMHAKind_BMM1_OUTPUT_UNKNOWN

Variables

View Source
var ActivationMode_name = protobuf.ActivationMode_name
View Source
var ActivationMode_value = protobuf.ActivationMode_value
View Source
var AlgorithmProto_MathType_name = protobuf.AlgorithmProto_MathType_name
View Source
var AlgorithmProto_MathType_value = protobuf.AlgorithmProto_MathType_value
View Source
var ConvolutionKind_name = protobuf.ConvolutionKind_name
View Source
var ConvolutionKind_value = protobuf.ConvolutionKind_value
View Source
var ConvolutionMode_name = protobuf.ConvolutionMode_name
View Source
var ConvolutionMode_value = protobuf.ConvolutionMode_value
View Source
var DataLayout_name = protobuf.DataLayout_name
View Source
var DataLayout_value = protobuf.DataLayout_value
View Source
var DataType_name = protobuf.DataType_name
View Source
var DataType_value = protobuf.DataType_value
View Source
var File_tensorflow_compiler_xla_stream_executor_device_description_proto protoreflect.FileDescriptor
View Source
var File_tensorflow_compiler_xla_stream_executor_dnn_proto protoreflect.FileDescriptor
View Source
var FilterLayout_name = protobuf.FilterLayout_name
View Source
var FilterLayout_value = protobuf.FilterLayout_value
View Source
var FusedMHAKind_name = protobuf.FusedMHAKind_name
View Source
var FusedMHAKind_value = protobuf.FusedMHAKind_value

Functions

This section is empty.

Types

type ActivationMode

type ActivationMode = protobuf.ActivationMode

type AlgorithmConfigProto

type AlgorithmConfigProto = protobuf.AlgorithmConfigProto

type AlgorithmConfigProto_Algorithm

type AlgorithmConfigProto_Algorithm = protobuf.AlgorithmConfigProto_Algorithm

type AlgorithmConfigProto_ScratchSize

type AlgorithmConfigProto_ScratchSize = protobuf.AlgorithmConfigProto_ScratchSize

type AlgorithmProto

type AlgorithmProto = protobuf.AlgorithmProto

type AlgorithmProto_MathType

type AlgorithmProto_MathType = protobuf.AlgorithmProto_MathType

type ConvolutionDescriptorProto

type ConvolutionDescriptorProto = protobuf.ConvolutionDescriptorProto

type ConvolutionKind

type ConvolutionKind = protobuf.ConvolutionKind

type ConvolutionMode

type ConvolutionMode = protobuf.ConvolutionMode

type CudaComputeCapabilityProto added in v2.12.0

type CudaComputeCapabilityProto struct {
	Major int32 `protobuf:"varint,1,opt,name=major,proto3" json:"major,omitempty"`
	Minor int32 `protobuf:"varint,2,opt,name=minor,proto3" json:"minor,omitempty"`
	// contains filtered or unexported fields
}

func (*CudaComputeCapabilityProto) Descriptor deprecated added in v2.12.0

func (*CudaComputeCapabilityProto) Descriptor() ([]byte, []int)

Deprecated: Use CudaComputeCapabilityProto.ProtoReflect.Descriptor instead.

func (*CudaComputeCapabilityProto) GetMajor added in v2.12.0

func (x *CudaComputeCapabilityProto) GetMajor() int32

func (*CudaComputeCapabilityProto) GetMinor added in v2.12.0

func (x *CudaComputeCapabilityProto) GetMinor() int32

func (*CudaComputeCapabilityProto) ProtoMessage added in v2.12.0

func (*CudaComputeCapabilityProto) ProtoMessage()

func (*CudaComputeCapabilityProto) ProtoReflect added in v2.12.0

func (x *CudaComputeCapabilityProto) ProtoReflect() protoreflect.Message

func (*CudaComputeCapabilityProto) Reset added in v2.12.0

func (x *CudaComputeCapabilityProto) Reset()

func (*CudaComputeCapabilityProto) String added in v2.12.0

func (x *CudaComputeCapabilityProto) String() string

type DataLayout

type DataLayout = protobuf.DataLayout

type DataType

type DataType = protobuf.DataType

type DnnVersionInfoProto added in v2.12.0

type DnnVersionInfoProto struct {
	Major int32 `protobuf:"varint,1,opt,name=major,proto3" json:"major,omitempty"`
	Minor int32 `protobuf:"varint,2,opt,name=minor,proto3" json:"minor,omitempty"`
	Patch int32 `protobuf:"varint,3,opt,name=patch,proto3" json:"patch,omitempty"`
	// contains filtered or unexported fields
}

func (*DnnVersionInfoProto) Descriptor deprecated added in v2.12.0

func (*DnnVersionInfoProto) Descriptor() ([]byte, []int)

Deprecated: Use DnnVersionInfoProto.ProtoReflect.Descriptor instead.

func (*DnnVersionInfoProto) GetMajor added in v2.12.0

func (x *DnnVersionInfoProto) GetMajor() int32

func (*DnnVersionInfoProto) GetMinor added in v2.12.0

func (x *DnnVersionInfoProto) GetMinor() int32

func (*DnnVersionInfoProto) GetPatch added in v2.12.0

func (x *DnnVersionInfoProto) GetPatch() int32

func (*DnnVersionInfoProto) ProtoMessage added in v2.12.0

func (*DnnVersionInfoProto) ProtoMessage()

func (*DnnVersionInfoProto) ProtoReflect added in v2.12.0

func (x *DnnVersionInfoProto) ProtoReflect() protoreflect.Message

func (*DnnVersionInfoProto) Reset added in v2.12.0

func (x *DnnVersionInfoProto) Reset()

func (*DnnVersionInfoProto) String added in v2.12.0

func (x *DnnVersionInfoProto) String() string

type FilterLayout

type FilterLayout = protobuf.FilterLayout

type FusedMHAKind added in v2.13.0

type FusedMHAKind = protobuf.FusedMHAKind

type GpuDeviceInfoProto added in v2.12.0

type GpuDeviceInfoProto struct {
	ThreadsPerBlockLimit      int32   `` /* 126-byte string literal not displayed */
	ThreadsPerWarp            int32   `protobuf:"varint,2,opt,name=threads_per_warp,json=threadsPerWarp,proto3" json:"threads_per_warp,omitempty"`
	SharedMemoryPerBlock      int32   `` /* 126-byte string literal not displayed */
	SharedMemoryPerCore       int32   `protobuf:"varint,4,opt,name=shared_memory_per_core,json=sharedMemoryPerCore,proto3" json:"shared_memory_per_core,omitempty"`
	ThreadsPerCoreLimit       int32   `protobuf:"varint,5,opt,name=threads_per_core_limit,json=threadsPerCoreLimit,proto3" json:"threads_per_core_limit,omitempty"`
	CoreCount                 int32   `protobuf:"varint,6,opt,name=core_count,json=coreCount,proto3" json:"core_count,omitempty"`
	FpusPerCore               int64   `protobuf:"varint,7,opt,name=fpus_per_core,json=fpusPerCore,proto3" json:"fpus_per_core,omitempty"`
	BlockDimLimitX            int32   `protobuf:"varint,8,opt,name=block_dim_limit_x,json=blockDimLimitX,proto3" json:"block_dim_limit_x,omitempty"`
	BlockDimLimitY            int32   `protobuf:"varint,9,opt,name=block_dim_limit_y,json=blockDimLimitY,proto3" json:"block_dim_limit_y,omitempty"`
	BlockDimLimitZ            int32   `protobuf:"varint,10,opt,name=block_dim_limit_z,json=blockDimLimitZ,proto3" json:"block_dim_limit_z,omitempty"`
	MemoryBandwidth           int64   `protobuf:"varint,11,opt,name=memory_bandwidth,json=memoryBandwidth,proto3" json:"memory_bandwidth,omitempty"`
	L2CacheSize               int64   `protobuf:"varint,12,opt,name=l2_cache_size,json=l2CacheSize,proto3" json:"l2_cache_size,omitempty"`
	ClockRateGhz              float32 `protobuf:"fixed32,13,opt,name=clock_rate_ghz,json=clockRateGhz,proto3" json:"clock_rate_ghz,omitempty"`
	DeviceMemorySize          int64   `protobuf:"varint,14,opt,name=device_memory_size,json=deviceMemorySize,proto3" json:"device_memory_size,omitempty"`
	SharedMemoryPerBlockOptin int32   `` /* 144-byte string literal not displayed */
	// contains filtered or unexported fields
}

func (*GpuDeviceInfoProto) Descriptor deprecated added in v2.12.0

func (*GpuDeviceInfoProto) Descriptor() ([]byte, []int)

Deprecated: Use GpuDeviceInfoProto.ProtoReflect.Descriptor instead.

func (*GpuDeviceInfoProto) GetBlockDimLimitX added in v2.12.0

func (x *GpuDeviceInfoProto) GetBlockDimLimitX() int32

func (*GpuDeviceInfoProto) GetBlockDimLimitY added in v2.12.0

func (x *GpuDeviceInfoProto) GetBlockDimLimitY() int32

func (*GpuDeviceInfoProto) GetBlockDimLimitZ added in v2.12.0

func (x *GpuDeviceInfoProto) GetBlockDimLimitZ() int32

func (*GpuDeviceInfoProto) GetClockRateGhz added in v2.12.0

func (x *GpuDeviceInfoProto) GetClockRateGhz() float32

func (*GpuDeviceInfoProto) GetCoreCount added in v2.12.0

func (x *GpuDeviceInfoProto) GetCoreCount() int32

func (*GpuDeviceInfoProto) GetDeviceMemorySize added in v2.12.0

func (x *GpuDeviceInfoProto) GetDeviceMemorySize() int64

func (*GpuDeviceInfoProto) GetFpusPerCore added in v2.12.0

func (x *GpuDeviceInfoProto) GetFpusPerCore() int64

func (*GpuDeviceInfoProto) GetL2CacheSize added in v2.12.0

func (x *GpuDeviceInfoProto) GetL2CacheSize() int64

func (*GpuDeviceInfoProto) GetMemoryBandwidth added in v2.12.0

func (x *GpuDeviceInfoProto) GetMemoryBandwidth() int64

func (*GpuDeviceInfoProto) GetSharedMemoryPerBlock added in v2.12.0

func (x *GpuDeviceInfoProto) GetSharedMemoryPerBlock() int32

func (*GpuDeviceInfoProto) GetSharedMemoryPerBlockOptin added in v2.13.0

func (x *GpuDeviceInfoProto) GetSharedMemoryPerBlockOptin() int32

func (*GpuDeviceInfoProto) GetSharedMemoryPerCore added in v2.12.0

func (x *GpuDeviceInfoProto) GetSharedMemoryPerCore() int32

func (*GpuDeviceInfoProto) GetThreadsPerBlockLimit added in v2.12.0

func (x *GpuDeviceInfoProto) GetThreadsPerBlockLimit() int32

func (*GpuDeviceInfoProto) GetThreadsPerCoreLimit added in v2.12.0

func (x *GpuDeviceInfoProto) GetThreadsPerCoreLimit() int32

func (*GpuDeviceInfoProto) GetThreadsPerWarp added in v2.12.0

func (x *GpuDeviceInfoProto) GetThreadsPerWarp() int32

func (*GpuDeviceInfoProto) ProtoMessage added in v2.12.0

func (*GpuDeviceInfoProto) ProtoMessage()

func (*GpuDeviceInfoProto) ProtoReflect added in v2.12.0

func (x *GpuDeviceInfoProto) ProtoReflect() protoreflect.Message

func (*GpuDeviceInfoProto) Reset added in v2.12.0

func (x *GpuDeviceInfoProto) Reset()

func (*GpuDeviceInfoProto) String added in v2.12.0

func (x *GpuDeviceInfoProto) String() string

type GpuTargetConfigProto added in v2.12.0

type GpuTargetConfigProto struct {
	GpuDeviceInfo *GpuDeviceInfoProto `protobuf:"bytes,1,opt,name=gpu_device_info,json=gpuDeviceInfo,proto3" json:"gpu_device_info,omitempty"`
	// Types that are assignable to ComputeCapability:
	//
	//	*GpuTargetConfigProto_CudaComputeCapability
	//	*GpuTargetConfigProto_RocmComputeCapability
	ComputeCapability isGpuTargetConfigProto_ComputeCapability `protobuf_oneof:"compute_capability"`
	PlatformName      string                                   `protobuf:"bytes,4,opt,name=platform_name,json=platformName,proto3" json:"platform_name,omitempty"`
	DnnVersionInfo    *DnnVersionInfoProto                     `protobuf:"bytes,5,opt,name=dnn_version_info,json=dnnVersionInfo,proto3" json:"dnn_version_info,omitempty"`
	// TODO(b/248362914): Autotuning results should be separate from
	// GpuTargetConfig because autotuning can be updated regularly separate from
	// the target.
	AutotuneResults      *xla.AutotuneResults `protobuf:"bytes,6,opt,name=autotune_results,json=autotuneResults,proto3" json:"autotune_results,omitempty"`
	DeviceDescriptionStr string               `protobuf:"bytes,7,opt,name=device_description_str,json=deviceDescriptionStr,proto3" json:"device_description_str,omitempty"`
	// contains filtered or unexported fields
}

func (*GpuTargetConfigProto) Descriptor deprecated added in v2.12.0

func (*GpuTargetConfigProto) Descriptor() ([]byte, []int)

Deprecated: Use GpuTargetConfigProto.ProtoReflect.Descriptor instead.

func (*GpuTargetConfigProto) GetAutotuneResults added in v2.12.0

func (x *GpuTargetConfigProto) GetAutotuneResults() *xla.AutotuneResults

func (*GpuTargetConfigProto) GetComputeCapability added in v2.12.0

func (m *GpuTargetConfigProto) GetComputeCapability() isGpuTargetConfigProto_ComputeCapability

func (*GpuTargetConfigProto) GetCudaComputeCapability added in v2.12.0

func (x *GpuTargetConfigProto) GetCudaComputeCapability() *CudaComputeCapabilityProto

func (*GpuTargetConfigProto) GetDeviceDescriptionStr added in v2.12.0

func (x *GpuTargetConfigProto) GetDeviceDescriptionStr() string

func (*GpuTargetConfigProto) GetDnnVersionInfo added in v2.12.0

func (x *GpuTargetConfigProto) GetDnnVersionInfo() *DnnVersionInfoProto

func (*GpuTargetConfigProto) GetGpuDeviceInfo added in v2.12.0

func (x *GpuTargetConfigProto) GetGpuDeviceInfo() *GpuDeviceInfoProto

func (*GpuTargetConfigProto) GetPlatformName added in v2.12.0

func (x *GpuTargetConfigProto) GetPlatformName() string

func (*GpuTargetConfigProto) GetRocmComputeCapability added in v2.12.0

func (x *GpuTargetConfigProto) GetRocmComputeCapability() *RocmComputeCapabilityProto

func (*GpuTargetConfigProto) ProtoMessage added in v2.12.0

func (*GpuTargetConfigProto) ProtoMessage()

func (*GpuTargetConfigProto) ProtoReflect added in v2.12.0

func (x *GpuTargetConfigProto) ProtoReflect() protoreflect.Message

func (*GpuTargetConfigProto) Reset added in v2.12.0

func (x *GpuTargetConfigProto) Reset()

func (*GpuTargetConfigProto) String added in v2.12.0

func (x *GpuTargetConfigProto) String() string

type GpuTargetConfigProto_CudaComputeCapability added in v2.12.0

type GpuTargetConfigProto_CudaComputeCapability struct {
	CudaComputeCapability *CudaComputeCapabilityProto `protobuf:"bytes,2,opt,name=cuda_compute_capability,json=cudaComputeCapability,proto3,oneof"`
}

type GpuTargetConfigProto_RocmComputeCapability added in v2.12.0

type GpuTargetConfigProto_RocmComputeCapability struct {
	RocmComputeCapability *RocmComputeCapabilityProto `protobuf:"bytes,3,opt,name=rocm_compute_capability,json=rocmComputeCapability,proto3,oneof"`
}

type RocmComputeCapabilityProto added in v2.12.0

type RocmComputeCapabilityProto struct {
	GcnArchName string `protobuf:"bytes,1,opt,name=gcn_arch_name,json=gcnArchName,proto3" json:"gcn_arch_name,omitempty"`
	// contains filtered or unexported fields
}

func (*RocmComputeCapabilityProto) Descriptor deprecated added in v2.12.0

func (*RocmComputeCapabilityProto) Descriptor() ([]byte, []int)

Deprecated: Use RocmComputeCapabilityProto.ProtoReflect.Descriptor instead.

func (*RocmComputeCapabilityProto) GetGcnArchName added in v2.12.0

func (x *RocmComputeCapabilityProto) GetGcnArchName() string

func (*RocmComputeCapabilityProto) ProtoMessage added in v2.12.0

func (*RocmComputeCapabilityProto) ProtoMessage()

func (*RocmComputeCapabilityProto) ProtoReflect added in v2.12.0

func (x *RocmComputeCapabilityProto) ProtoReflect() protoreflect.Message

func (*RocmComputeCapabilityProto) Reset added in v2.12.0

func (x *RocmComputeCapabilityProto) Reset()

func (*RocmComputeCapabilityProto) String added in v2.12.0

func (x *RocmComputeCapabilityProto) String() string

type TensorDescriptorProto

type TensorDescriptorProto = protobuf.TensorDescriptorProto

type TensorDescriptorProto_DataLayout

type TensorDescriptorProto_DataLayout = protobuf.TensorDescriptorProto_DataLayout

type TensorDescriptorProto_FilterLayout

type TensorDescriptorProto_FilterLayout = protobuf.TensorDescriptorProto_FilterLayout

Jump to

Keyboard shortcuts

? : This menu
/ : Search site
f or F : Jump to
y or Y : Canonical URL