Struct GpuCircuitCache

Source

pub struct GpuCircuitCache { /* private fields */ }

Implementations§

Source §

impl GpuCircuitCache

Source

pub fn provider(&self) -> &Arc<CudaKernelProvider>

Source

pub fn var_log_weights_mut( &mut self, ) -> (&mut TrackedCudaSlice<f64>, &mut TrackedCudaSlice<f64>)

Source

pub fn new( provider: &Arc<CudaKernelProvider>, config: GpuCircuitCacheConfig, ) -> Result<Self>

Source

pub fn lookup_or_insert(&mut self, key: u64) -> Result<GpuCacheLookup>

Source

pub fn claim_slot(&mut self, key: u64) -> Result<GpuCircuitCacheHandle>

Source

pub fn store_from_xgcf( &mut self, handle: &mut GpuCircuitCacheHandle, xgcf: &GpuXgcf, ) -> Result<()>

Source

pub fn store_weights( &mut self, handle: &GpuCircuitCacheHandle, weights_true: &TrackedCudaSlice<f64>, weights_false: &TrackedCudaSlice<f64>, ) -> Result<()>

Source

pub fn overwrite_weights( &mut self, handle: &GpuCircuitCacheHandle, weights_true: &TrackedCudaSlice<f64>, weights_false: &TrackedCudaSlice<f64>, ) -> Result<()>

Source

pub fn store_free_var_mask( &mut self, handle: &GpuCircuitCacheHandle, mask: &TrackedCudaSlice<u8>, ) -> Result<()>

Source

pub fn eval_log_wmc_device_inplace( &mut self, handle: &GpuCircuitCacheHandle, out_log_z: &mut TrackedCudaSlice<f64>, ) -> Result<()>

Source

pub fn eval_log_wmc_device_only( &mut self, handle: &GpuCircuitCacheHandle, out_log_z: &mut TrackedCudaSlice<f64>, ) -> Result<()>

Source

pub fn eval_grads_inplace( &mut self, handle: &GpuCircuitCacheHandle, ) -> Result<()>

Source

pub fn eval_grads_inplace_fused( &mut self, handle: &GpuCircuitCacheHandle, ) -> Result<()>

Like [`eval_grads_inplace`], but replaces the per-level backward loop with a single launch of `xgcf_backward_all_levels_cached` and omits the trailing `device().synchronize()`, so that the caller can batch multiple queries before syncing.

Auto Trait Implementations§

§

impl Freeze for GpuCircuitCache

§

impl RefUnwindSafe for GpuCircuitCache

§

impl Send for GpuCircuitCache

§

impl Sync for GpuCircuitCache

§

impl Unpin for GpuCircuitCache

§

impl UnsafeUnpin for GpuCircuitCache

§

impl UnwindSafe for GpuCircuitCache

Blanket Implementations§

Source §

impl<T> Any for T
where T: 'static + ?Sized,

Source §

fn type_id(&self) -> TypeId

Gets the TypeId of self. Read more

Source §

impl<T> Borrow<T> for T
where T: ?Sized,

Source §

fn borrow(&self) -> &T

Immutably borrows from an owned value. Read more

Source §

impl<T> BorrowMut<T> for T
where T: ?Sized,

Source §

fn borrow_mut(&mut self) -> &mut T

Mutably borrows from an owned value. Read more

Source §

impl<T> From<T> for T

Source §

fn from(t: T) -> T

Returns the argument unchanged.

Source §

impl<T, U> Into<U> for T
where U: From<T>,

Source §

fn into(self) -> U

Calls U::from(self).

That is, this conversion is whatever the implementation of From<T> for U chooses to do.

Source §

impl<T, U> TryFrom<U> for T
where U: Into<T>,

Source §

type Error = Infallible

The type returned in the event of a conversion error.

Source §

fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

Performs the conversion.

Source §

impl<T, U> TryInto<U> for T
where U: TryFrom<T>,

Source §

type Error = <U as TryFrom<T>>::Error

The type returned in the event of a conversion error.

Source §

fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

Performs the conversion.

§

GpuCircuitCache

Struct GpuCircuitCache Copy item path

Implementations§

impl GpuCircuitCache

pub fn provider(&self) -> &Arc<CudaKernelProvider>

pub fn var_log_weights_mut( &mut self, ) -> (&mut TrackedCudaSlice<f64>, &mut TrackedCudaSlice<f64>)

pub fn grad_true(&self) -> &TrackedCudaSlice<f64>

pub fn grad_false(&self) -> &TrackedCudaSlice<f64>

pub fn values(&self) -> &TrackedCudaSlice<f64>

pub fn meta_num_nodes_device(&self) -> &TrackedCudaSlice<u32>

pub fn meta_num_levels_device(&self) -> &TrackedCudaSlice<u32>

pub fn meta_root_device(&self) -> &TrackedCudaSlice<u32>

pub fn meta_max_var_device(&self) -> &TrackedCudaSlice<u32>

pub fn num_slots(&self) -> u32

pub fn new( provider: &Arc<CudaKernelProvider>, config: GpuCircuitCacheConfig, ) -> Result<Self>

pub fn lookup_or_insert(&mut self, key: u64) -> Result<GpuCacheLookup>

pub fn claim_slot(&mut self, key: u64) -> Result<GpuCircuitCacheHandle>

pub fn store_from_xgcf( &mut self, handle: &mut GpuCircuitCacheHandle, xgcf: &GpuXgcf, ) -> Result<()>

pub fn store_weights( &mut self, handle: &GpuCircuitCacheHandle, weights_true: &TrackedCudaSlice<f64>, weights_false: &TrackedCudaSlice<f64>, ) -> Result<()>

pub fn overwrite_weights( &mut self, handle: &GpuCircuitCacheHandle, weights_true: &TrackedCudaSlice<f64>, weights_false: &TrackedCudaSlice<f64>, ) -> Result<()>

pub fn store_free_var_mask( &mut self, handle: &GpuCircuitCacheHandle, mask: &TrackedCudaSlice<u8>, ) -> Result<()>

pub fn eval_log_wmc_device_inplace( &mut self, handle: &GpuCircuitCacheHandle, out_log_z: &mut TrackedCudaSlice<f64>, ) -> Result<()>

pub fn eval_log_wmc_device_only( &mut self, handle: &GpuCircuitCacheHandle, out_log_z: &mut TrackedCudaSlice<f64>, ) -> Result<()>

pub fn eval_grads_inplace( &mut self, handle: &GpuCircuitCacheHandle, ) -> Result<()>

pub fn eval_grads_inplace_fused( &mut self, handle: &GpuCircuitCacheHandle, ) -> Result<()>

Auto Trait Implementations§

impl Freeze for GpuCircuitCache

impl RefUnwindSafe for GpuCircuitCache

impl Send for GpuCircuitCache

impl Sync for GpuCircuitCache

impl Unpin for GpuCircuitCache

impl UnsafeUnpin for GpuCircuitCache

impl UnwindSafe for GpuCircuitCache

Blanket Implementations§

impl<T> Any for T where T: 'static + ?Sized,

fn type_id(&self) -> TypeId

impl<T> Borrow<T> for T where T: ?Sized,

fn borrow(&self) -> &T

impl<T> BorrowMut<T> for T where T: ?Sized,

fn borrow_mut(&mut self) -> &mut T

impl<T> From<T> for T

fn from(t: T) -> T

impl<T, U> Into<U> for T where U: From<T>,

fn into(self) -> U

impl<T, U> TryFrom<U> for T where U: Into<T>,

type Error = Infallible

fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

impl<T, U> TryInto<U> for T where U: TryFrom<T>,

type Error = <U as TryFrom<T>>::Error

fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

impl<T> Allocation for T where T: RefUnwindSafe + Send + Sync,

Struct GpuCircuitCache

impl<T> Any for T
where T: 'static + ?Sized,

impl<T> Borrow<T> for T
where T: ?Sized,

impl<T> BorrowMut<T> for T
where T: ?Sized,

impl<T, U> Into<U> for T
where U: From<T>,

impl<T, U> TryFrom<U> for T
where U: Into<T>,

impl<T, U> TryInto<U> for T
where U: TryFrom<T>,

impl<T> Allocation for T
where T: RefUnwindSafe + Send + Sync,