-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathmodel.py
More file actions
88 lines (62 loc) · 1.86 KB
/
model.py
File metadata and controls
88 lines (62 loc) · 1.86 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
import functools

import torch
import vollo_compiler
import vollo_torch
from torch import nn
from vollo_torch import nn as vv
def eval(fn):
    """Decorator: run a Module method in inference mode.

    Temporarily switches the module to ``eval()`` and disables gradient
    tracking for the duration of the call, then restores the previous
    training flag — even if the wrapped method raises.

    NOTE: the name shadows the builtin ``eval``; it is kept so existing
    ``@eval`` call sites continue to work.

    Args:
        fn: a bound-style method ``fn(self, *args, **kwargs)`` where
            ``self`` is an ``nn.Module``.

    Returns:
        The wrapped method.
    """

    @functools.wraps(fn)  # preserve the wrapped method's name/docstring
    @torch.no_grad()
    def inner(self, *args, **kwargs):
        was_training = self.training
        self.eval()
        try:
            return fn(self, *args, **kwargs)
        finally:
            # Restore the caller's train/eval mode even on exception.
            self.train(was_training)

    return inner
class Net(nn.Module):
    """Stacked-LSTM per-time-step binary classifier.

    Two ``vv.LSTM`` layers with dropout in between, followed by a linear
    head that produces one logit per time step.
    """

    def __init__(
        self,
        input_size,
        hid: int = 64,
        dropout: float = 0.1,
    ):
        """
        Args:
            input_size: number of input features per time step.
            hid: hidden size of both LSTM layers.
            dropout: dropout probability applied after each LSTM.
        """
        # nn.Module must be initialised before any attribute assignment
        # so Module.__setattr__ bookkeeping is in place.
        super().__init__()
        self.input_size = input_size
        kwargs = {
            "hidden_size": hid,
            "batch_first": True,
        }
        self.post = nn.Sequential(
            vv.LSTM(input_size=input_size, **kwargs),
            nn.Dropout(p=dropout),
            vv.LSTM(input_size=hid, **kwargs),
            nn.Dropout(p=dropout),
            nn.Linear(hid, 1),
        )

    def forward(self, x):
        """
        Args:
            x: [B, T, H] input sequence.

        Returns:
            r: [B, T, 1]. Sigmoid probabilities in [0, 1] while training;
               hard {0, 1} integer predictions in eval mode.
        """
        x = self.post(x)
        if self.training:
            return torch.sigmoid(x)
        # sigmoid(x) > 0.5  <=>  x > 0, so threshold on the raw logit.
        return torch.where(x > 0, 1, 0)

    @eval
    def compile(self, num_cores=1, block_size=16):
        """Compile the model to a Vollo program and collect VM timing stats.

        Runs in eval mode (via ``@eval``) so dropout is disabled during
        tracing/compilation.

        Args:
            num_cores: number of IP cores in the target hardware config.
            block_size: block size of the target hardware config.

        Returns:
            Tuple ``(nnir, program, stats)`` where ``stats`` holds the VM
            cycle count and compute latency in microseconds for one frame.
        """
        config = vollo_compiler.Config.ip_core(
            num_cores=num_cores, block_size=block_size
        )
        dummy = torch.randn(1, 1, self.input_size)
        model, _ = vollo_torch.fx.prepare_shape(self, dummy)
        nnir, _ = vollo_torch.fx.nnir.to_nnir(model).streaming_transform(1)
        program = nnir.to_program(config)
        vm = program.to_vm()
        # The streaming transform removes the time-dimension
        vm.run(dummy[:, 0, :].detach().numpy())
        stats = {
            "cycle_count": vm.cycle_count(),
            "compute_latency/us": vm.compute_duration_us(),
        }
        return nnir, program, stats