# laguerre_kan.py
import torch
import torch.nn as nn
from typing import List

# code modified from https://github.com/Boris-73-TA/OrthogPolyKANs


class LaguerreKANLayer(nn.Module):
def __init__(self, input_dim, output_dim, degree, alpha):
super(LaguerreKANLayer, self).__init__()
self.input_dim = input_dim
self.output_dim = output_dim
self.degree = degree
self.alpha = alpha # Alpha parameter for generalized Laguerre polynomials
# Initialize coefficients for the Laguerre polynomials
self.laguerre_coeffs = nn.Parameter(torch.empty(input_dim, output_dim, degree + 1))
        nn.init.normal_(self.laguerre_coeffs, mean=0.0, std=1 / (input_dim * (degree + 1)))

    def forward(self, x):
        x = x.view(-1, self.input_dim)  # reshape to (batch_size, input_dim)
        x = torch.tanh(x)  # squash inputs into (-1, 1) so the polynomial recurrence stays numerically stable
# Initialize Laguerre polynomial tensors
laguerre = torch.zeros(x.size(0), self.input_dim, self.degree + 1, device=x.device)
laguerre[:, :, 0] = 1 # L_0^alpha(x) = 1
if self.degree > 0:
laguerre[:, :, 1] = 1 + self.alpha - x # L_1^alpha(x) = 1 + alpha - x
for k in range(2, self.degree + 1):
            # Generalized recurrence: k * L_k^a(x) = (2k - 1 + a - x) * L_{k-1}^a(x) - (k - 1 + a) * L_{k-2}^a(x)
            term1 = (2 * (k - 1) + 1 + self.alpha - x) * laguerre[:, :, k - 1].clone()
            term2 = (k - 1 + self.alpha) * laguerre[:, :, k - 2].clone()
            laguerre[:, :, k] = (term1 - term2) / k
        # Optional: squash the polynomial outputs to prevent runaway values
        # laguerre = torch.tanh(laguerre)
        # Contract the Laguerre basis with the learned coefficients
        y = torch.einsum('bid,iod->bo', laguerre, self.laguerre_coeffs)  # shape: (batch_size, output_dim)
        y = y.view(-1, self.output_dim)
return y
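

def _check_laguerre_recurrence(degree: int = 4, alpha: float = -0.5) -> None:
    # Sanity-check sketch (not part of the original repo): re-runs the same
    # recurrence as LaguerreKANLayer.forward on a small 1-D grid and compares
    # it against scipy.special.eval_genlaguerre. Assumes scipy is installed;
    # the function name and defaults here are illustrative.
    from scipy.special import eval_genlaguerre
    x = torch.linspace(-0.9, 0.9, 5)  # tanh-squashed inputs live in (-1, 1)
    L = torch.zeros(degree + 1, x.numel())
    L[0] = 1.0
    if degree > 0:
        L[1] = 1 + alpha - x
    for k in range(2, degree + 1):
        L[k] = ((2 * (k - 1) + 1 + alpha - x) * L[k - 1] - (k - 1 + alpha) * L[k - 2]) / k
    for k in range(degree + 1):
        ref = torch.tensor(eval_genlaguerre(k, alpha, x.numpy()), dtype=torch.float32)
        assert torch.allclose(L[k], ref, atol=1e-5), f"recurrence mismatch at degree {k}"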


# LayerNorm wrapper to counteract gradient vanishing caused by the tanh squashing
class LaguerreKANLayerNorm(nn.Module):
def __init__(self, input_dim, output_dim, degree, alpha):
super(LaguerreKANLayerNorm, self).__init__()
self.layer = LaguerreKANLayer(input_dim=input_dim, output_dim=output_dim, degree=degree, alpha=alpha)
        self.layer_norm = nn.LayerNorm(output_dim)  # to avoid gradient vanishing caused by tanh

    def forward(self, x):
x = self.layer(x)
x = self.layer_norm(x)
return x


class Laguerre_KAN(nn.Module):
def __init__(
self,
layers_hidden: List[int],
degree: int = 3,
alpha: float = -0.5,
        grid_size: int = 8,  # placeholder, unused; kept for interface compatibility
        spline_order: float = 0.,  # placeholder, unused; kept for interface compatibility
) -> None:
super().__init__()
self.layers = nn.ModuleList([
LaguerreKANLayerNorm(
input_dim=in_dim,
output_dim=out_dim,
degree=degree,
alpha=alpha
) for in_dim, out_dim in zip(layers_hidden[:-1], layers_hidden[1:])
        ])

    def forward(self, x):
for layer in self.layers:
x = layer(x)
return x
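

# Usage sketch (illustrative, not from the original repo): build a small
# [4, 16, 3] network with the defaults above and run a forward pass; the
# layer sizes, batch size, and seed are arbitrary.
if __name__ == "__main__":
    torch.manual_seed(0)
    model = Laguerre_KAN(layers_hidden=[4, 16, 3], degree=3, alpha=-0.5)
    x = torch.randn(8, 4)  # (batch_size, input_dim)
    y = model(x)
    print(y.shape)  # expected: torch.Size([8, 3])
    try:
        _check_laguerre_recurrence()
        print("recurrence matches scipy.special.eval_genlaguerre")
    except ImportError:
        pass  # scipy not installed; skip the polynomial sanity check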