Memory Constrained Scheduling

from b_asic.architecture import Architecture, Memory, ProcessingElement
from b_asic.core_operations import ConstantMultiplication
from b_asic.fft_operations import R2Butterfly
from b_asic.list_schedulers import HybridScheduler
from b_asic.schedule import Schedule
from b_asic.scheduler import ASAPScheduler
from b_asic.sfg_generators import radix_2_dif_fft
from b_asic.special_operations import Input, Output

# Build the signal flow graph (SFG) with the radix-2 DIF FFT generator,
# requesting 16 points.
sfg = radix_2_dif_fft(points=16)

The SFG is

sfg
%3 in0 in0 r2bfly0 r2bfly0 in0->r2bfly0 0 r2bfly1 r2bfly1 r2bfly0->r2bfly1 0 0 r2bfly2 r2bfly2 r2bfly0->r2bfly2 0 1 in1 in1 r2bfly15 r2bfly15 in1->r2bfly15 0 cmul8 cmul8 r2bfly15->cmul8 1 r2bfly14 r2bfly14 r2bfly15->r2bfly14 0 0 in2 in2 r2bfly22 r2bfly22 in2->r2bfly22 0 r2bfly21 r2bfly21 r2bfly22->r2bfly21 0 0 cmul16 cmul16 r2bfly22->cmul16 1 in3 in3 r2bfly29 r2bfly29 in3->r2bfly29 0 cmul5 cmul5 r2bfly29->cmul5 1 r2bfly28 r2bfly28 r2bfly29->r2bfly28 0 0 in4 in4 r2bfly31 r2bfly31 in4->r2bfly31 0 r2bfly31->r2bfly1 1 0 cmul0 cmul0 r2bfly31->cmul0 1 in5 in5 r2bfly13 r2bfly13 in5->r2bfly13 0 cmul9 cmul9 r2bfly13->cmul9 1 r2bfly13->r2bfly14 1 0 in6 in6 r2bfly23 r2bfly23 in6->r2bfly23 0 r2bfly23->r2bfly21 1 0 cmul15 cmul15 r2bfly23->cmul15 1 in7 in7 r2bfly30 r2bfly30 in7->r2bfly30 0 cmul6 cmul6 r2bfly30->cmul6 1 r2bfly30->r2bfly28 1 0 in8 in8 in8->r2bfly0 1 in9 in9 in9->r2bfly15 1 in10 in10 in10->r2bfly22 1 in11 in11 in11->r2bfly29 1 in12 in12 in12->r2bfly31 1 in13 in13 in13->r2bfly13 1 in14 in14 in14->r2bfly23 1 in15 in15 in15->r2bfly30 1 out0 out0 r2bfly25 r2bfly25 r2bfly25->out0 0 out8 out8 r2bfly25->out8 1 out1 out1 r2bfly11 r2bfly11 r2bfly11->out1 0 out9 out9 r2bfly11->out9 1 out2 out2 r2bfly18 r2bfly18 r2bfly18->out2 0 out10 out10 r2bfly18->out10 1 out3 out3 r2bfly5 r2bfly5 r2bfly5->out3 0 out11 out11 r2bfly5->out11 1 out4 out4 r2bfly26 r2bfly26 r2bfly26->out4 0 out12 out12 r2bfly26->out12 1 out5 out5 r2bfly12 r2bfly12 r2bfly12->out5 0 out13 out13 r2bfly12->out13 1 out6 out6 r2bfly19 r2bfly19 r2bfly19->out6 0 out14 out14 r2bfly19->out14 1 out7 out7 r2bfly6 r2bfly6 r2bfly6->out7 0 out15 out15 r2bfly6->out15 1 r2bfly20 r2bfly20 r2bfly1->r2bfly20 0 1 r2bfly24 r2bfly24 r2bfly1->r2bfly24 0 0 r2bfly3 r2bfly3 r2bfly2->r2bfly3 0 0 r2bfly4 r2bfly4 r2bfly2->r2bfly4 0 1 cmul0->r2bfly2 1 r2bfly3->r2bfly11 0 0 r2bfly3->r2bfly12 0 1 r2bfly4->r2bfly5 0 0 r2bfly4->r2bfly6 0 1 cmul1 cmul1 cmul1->r2bfly4 1 cmul2 cmul2 cmul2->r2bfly6 1 r2bfly7 r2bfly7 r2bfly7->r2bfly5 1 0 
r2bfly7->cmul2 1 cmul3 cmul3 cmul3->r2bfly7 0 cmul4 cmul4 cmul4->r2bfly7 1 r2bfly8 r2bfly8 r2bfly8->cmul4 1 r2bfly9 r2bfly9 r2bfly8->r2bfly9 1 0 cmul5->r2bfly8 0 cmul6->r2bfly8 1 r2bfly9->r2bfly11 1 0 cmul7 cmul7 r2bfly9->cmul7 1 r2bfly10 r2bfly10 r2bfly10->cmul3 1 r2bfly10->r2bfly9 0 0 cmul7->r2bfly12 1 cmul8->r2bfly10 0 cmul9->r2bfly10 1 r2bfly16 r2bfly16 r2bfly14->r2bfly16 0 0 cmul10 cmul10 r2bfly14->cmul10 1 r2bfly16->r2bfly25 1 0 cmul14 cmul14 r2bfly16->cmul14 1 r2bfly17 r2bfly17 cmul10->r2bfly17 0 r2bfly17->r2bfly18 1 0 cmul12 cmul12 r2bfly17->cmul12 1 cmul11 cmul11 cmul11->r2bfly17 1 cmul12->r2bfly19 1 r2bfly20->r2bfly18 0 0 r2bfly20->r2bfly19 0 1 cmul13 cmul13 cmul13->r2bfly20 1 r2bfly21->cmul13 1 r2bfly21->r2bfly24 1 0 r2bfly24->r2bfly25 0 0 r2bfly24->r2bfly26 0 1 cmul14->r2bfly26 1 r2bfly27 r2bfly27 cmul15->r2bfly27 1 r2bfly27->r2bfly3 1 0 r2bfly27->cmul1 1 cmul16->r2bfly27 0 r2bfly28->r2bfly16 1 0 r2bfly28->cmul11 1


Set latencies and execution times.

# Latency: 3 for every R2Butterfly, 2 for every ConstantMultiplication.
sfg.set_latency_of_type(R2Butterfly, 3)
sfg.set_latency_of_type(ConstantMultiplication, 2)
# Execution time: 1 for both operation types.
sfg.set_execution_time_of_type(R2Butterfly, 1)
sfg.set_execution_time_of_type(ConstantMultiplication, 1)

# Generate an ASAP schedule for reference and plot it.
schedule1 = Schedule(sfg, scheduler=ASAPScheduler())
schedule1.show()
memory constrained scheduling

Generate a PE-constrained schedule using the HybridScheduler.

# Resource limits keyed by operation type name: 1 for R2Butterfly and 1 for
# ConstantMultiplication (presumably the number of processing elements
# allowed per type -- confirm against the HybridScheduler documentation).
resources = {R2Butterfly.type_name(): 1, ConstantMultiplication.type_name(): 1}
# Schedule the same SFG with the HybridScheduler under these limits and plot it.
schedule2 = Schedule(sfg, scheduler=HybridScheduler(resources))
schedule2.show()
memory constrained scheduling
# split_on_length() yields two collections. The first is kept as `direct`
# (it is passed to Architecture as direct_interconnects further down); the
# second, `mem_vars`, holds the variables that are assigned to memories.
direct, mem_vars = schedule2.get_memory_variables().split_on_length()
# Print the read and write port bounds reported for the stored variables.
print("Max read ports:", mem_vars.read_ports_bound())
print("Max write ports:", mem_vars.write_ports_bound())
Max read ports: 3
Max write ports: 3
# Fetch the operation executions of schedule2, select them by operation type
# name, and plot each selection under its own title.
operations = schedule2.get_operations()
bfs = operations.get_by_type_name(R2Butterfly.type_name())
bfs.show(title="R2Butterfly executions")
const_muls = operations.get_by_type_name(ConstantMultiplication.type_name())
const_muls.show(title="ConstMul executions")
inputs = operations.get_by_type_name(Input.type_name())
inputs.show(title="Input executions")
outputs = operations.get_by_type_name(Output.type_name())
outputs.show(title="Output executions")

# One processing element per operation type: butterflies and multiplications.
bf_pe = ProcessingElement(bfs, entity_name="bf")
mul_pe = ProcessingElement(const_muls, entity_name="mul")

# Inputs and outputs are wrapped in processing elements as well.
pe_in = ProcessingElement(inputs, entity_name='input')
pe_out = ProcessingElement(outputs, entity_name='output')

# Re-fetch the memory variables so the complete set can be plotted before it
# is split; `direct` and `mem_vars` are then rebound from the split result.
mem_vars = schedule2.get_memory_variables()
mem_vars.show(title="All memory variables")
direct, mem_vars = mem_vars.split_on_length()
mem_vars.show(title="Non-zero time memory variables")
# Partition the stored variables under the port limits given here: 1 read
# port, 1 write port, 2 ports in total, using the "greedy_graph_color"
# strategy. Each resulting collection becomes one Memory below.
mem_vars_set = mem_vars.split_on_ports(
    read_ports=1, write_ports=1, total_ports=2, strategy="greedy_graph_color"
)
  • R2Butterfly executions
  • ConstMul executions
  • Input executions
  • Output executions
  • All memory variables
  • Non-zero time memory variables
# Create one RAM per collection in mem_vars_set, named memory0, memory1, ...
memories = []
for i, mem in enumerate(mem_vars_set):
    memory = Memory(mem, memory_type="RAM", entity_name=f"memory{i}")
    memories.append(memory)
    # Plot the variables of this memory, titled with the memory's entity name.
    mem.show(title=f"{memory.entity_name}")
    # Run the "greedy_graph_color" assignment on this memory, then plot the
    # resulting content.
    memory.assign("greedy_graph_color")
    memory.show_content(title=f"Assigned {memory.entity_name}")

# Plot the collection kept as `direct` by split_on_length().
direct.show(title="Direct interconnects")
  • memory0
  • Assigned memory0
  • memory1
  • Assigned memory1
  • memory2
  • Assigned memory2
  • Direct interconnects
# Assemble the architecture from the four processing elements, the list of
# memories, and the direct interconnects.
arch = Architecture(
    {bf_pe, mul_pe, pe_in, pe_out},
    memories,
    direct_interconnects=direct,
)
# Bare expression as the last statement of the cell, so the architecture is
# displayed in the rendered example.
arch
%3 cluster_memories Memories cluster_pes Processing Elements cluster_io I/O memory0 in0 memory0: (RAM, 5 cells) out0 memory0out0_branch memory0:out0->memory0out0_branch memory1 in0 memory1: (RAM, 5 cells) out0 memory1out0_branch memory1:out0->memory1out0_branch memory2 in0 memory2: (RAM, 2 cells) out0 memory2out0_branch memory2:out0->memory2out0_branch mul in0 mul out0 mulout0_branch mul:out0->mulout0_branch bf in0 in1 bf out0 out1 bfout1_branch bf:out1->bfout1_branch bfout0_branch bf:out0->bfout0_branch input input out0 inputout0_branch input:out0->inputout0_branch output in0 output bf_in1_mux in0 in1 in2 in3 bf_in1_mux out0 bf_in1_mux:out0->bf:in1 memory0_in0_mux in0 in1 in2 in3 memory0_in0_mux out0 memory0_in0_mux:out0->memory0:in0 memory1_in0_mux in0 in1 in2 in3 memory1_in0_mux out0 memory1_in0_mux:out0->memory1:in0 memory2_in0_mux in0 in1 in2 in3 memory2_in0_mux out0 memory2_in0_mux:out0->memory2:in0 bf_in0_mux in0 in1 in2 in3 in4 bf_in0_mux out0 bf_in0_mux:out0->bf:in0 output_in0_mux in0 in1 in2 in3 output_in0_mux out0 output_in0_mux:out0->output:in0 inputout0_branch->bf_in1_mux:in1 8 inputout0_branch->memory0_in0_mux:in1 5 inputout0_branch->memory1_in0_mux:in1 1 inputout0_branch->memory2_in0_mux:in1 2 bfout1_branch->mul:in0 17 bfout1_branch->memory0_in0_mux:in0 6 bfout1_branch->memory1_in0_mux:in0 6 bfout1_branch->memory2_in0_mux:in0 3 mulout0_branch->memory0_in0_mux:in2 7 mulout0_branch->memory1_in0_mux:in2 7 mulout0_branch->memory2_in0_mux:in2 1 mulout0_branch->bf_in0_mux:in0 2 bfout0_branch->memory0_in0_mux:in3 12 bfout0_branch->memory1_in0_mux:in3 13 bfout0_branch->memory2_in0_mux:in3 1 bfout0_branch->bf_in0_mux:in2 3 bfout0_branch->output_in0_mux:in2 3 memory0out0_branch->bf_in1_mux:in0 10 memory0out0_branch->bf_in0_mux:in4 14 memory0out0_branch->output_in0_mux:in0 6 memory2out0_branch->bf_in1_mux:in2 1 memory2out0_branch->bf_in0_mux:in3 4 memory2out0_branch->output_in0_mux:in1 2 memory1out0_branch->bf_in1_mux:in3 13 memory1out0_branch->bf_in0_mux:in1 9 
memory1out0_branch->output_in0_mux:in3 5


Generate another schedule with the HybridScheduler, but this time constrain the number of concurrent reads and writes to reduce the number of memories.

# Same per-type resource limits as for the previous HybridScheduler run.
resources = {R2Butterfly.type_name(): 1, ConstantMultiplication.type_name(): 1}
# Additionally pass max_concurrent_reads=2 and max_concurrent_writes=2 to the
# scheduler, then plot the resulting schedule.
schedule3 = Schedule(
    sfg,
    scheduler=HybridScheduler(
        resources, max_concurrent_reads=2, max_concurrent_writes=2
    ),
)
schedule3.show()
memory constrained scheduling
# split_on_length() yields two collections. The first is kept as `direct`
# (it is passed to Architecture as direct_interconnects further down); the
# second, `mem_vars`, holds the variables that are assigned to memories.
direct, mem_vars = schedule3.get_memory_variables().split_on_length()
# Print the read and write port bounds reported for the stored variables.
print("Max read ports:", mem_vars.read_ports_bound())
print("Max write ports:", mem_vars.write_ports_bound())
Max read ports: 2
Max write ports: 2
# Fetch the operation executions of schedule3, select them by operation type
# name, and plot each selection under its own title.
operations = schedule3.get_operations()
bfs = operations.get_by_type_name(R2Butterfly.type_name())
bfs.show(title="R2Butterfly executions")
const_muls = operations.get_by_type_name(ConstantMultiplication.type_name())
const_muls.show(title="ConstMul executions")
inputs = operations.get_by_type_name(Input.type_name())
inputs.show(title="Input executions")
outputs = operations.get_by_type_name(Output.type_name())
outputs.show(title="Output executions")

# One processing element per operation type: butterflies and multiplications.
bf_pe = ProcessingElement(bfs, entity_name="bf")
mul_pe = ProcessingElement(const_muls, entity_name="mul")

# Inputs and outputs are wrapped in processing elements as well.
pe_in = ProcessingElement(inputs, entity_name='input')
pe_out = ProcessingElement(outputs, entity_name='output')

# `mem_vars` here is the second collection returned by the split_on_length()
# call on schedule3's memory variables.
mem_vars.show(title="Non-zero time memory variables")
# Partition the stored variables under the port limits given here: 1 read
# port, 1 write port, 2 ports in total, using the "greedy_graph_color"
# strategy. Each resulting collection becomes one Memory below.
mem_vars_set = mem_vars.split_on_ports(
    strategy="greedy_graph_color", read_ports=1, write_ports=1, total_ports=2
)
  • R2Butterfly executions
  • ConstMul executions
  • Input executions
  • Output executions
  • Non-zero time memory variables
# Create one RAM per collection in mem_vars_set, named memory0, memory1, ...
memories = []
for i, mem in enumerate(mem_vars_set):
    memory = Memory(mem, memory_type="RAM", entity_name=f"memory{i}")
    memories.append(memory)
    # Plot the variables of this memory, titled with the memory's entity name.
    mem.show(title=f"{memory.entity_name}")
    # Run the "greedy_graph_color" assignment on this memory, then plot the
    # resulting content.
    memory.assign("greedy_graph_color")
    memory.show_content(title=f"Assigned {memory.entity_name}")

# Plot the collection kept as `direct` by split_on_length().
direct.show(title="Direct interconnects")
  • memory0
  • Assigned memory0
  • memory1
  • Assigned memory1
  • Direct interconnects
# Assemble the architecture from the four processing elements, the list of
# memories, and the direct interconnects.
arch = Architecture(
    {bf_pe, mul_pe, pe_in, pe_out},
    memories,
    direct_interconnects=direct,
)
# Bare expression as the last statement of the cell, so the architecture is
# displayed in the rendered example.
arch
%3 cluster_memories Memories cluster_pes Processing Elements cluster_io I/O memory0 in0 memory0: (RAM, 7 cells) out0 memory0out0_branch memory0:out0->memory0out0_branch memory1 in0 memory1: (RAM, 7 cells) out0 memory1out0_branch memory1:out0->memory1out0_branch bf in0 in1 bf out0 out1 bfout0_branch bf:out0->bfout0_branch bfout1_branch bf:out1->bfout1_branch mul in0 mul out0 mulout0_branch mul:out0->mulout0_branch input input out0 inputout0_branch input:out0->inputout0_branch output in0 output bf_in0_mux in0 in1 in2 in3 bf_in0_mux out0 bf_in0_mux:out0->bf:in0 bf_in1_mux in0 in1 in2 in3 bf_in1_mux out0 bf_in1_mux:out0->bf:in1 output_in0_mux in0 in1 in2 output_in0_mux out0 output_in0_mux:out0->output:in0 memory1_in0_mux in0 in1 in2 in3 memory1_in0_mux out0 memory1_in0_mux:out0->memory1:in0 memory0_in0_mux in0 in1 in2 in3 memory0_in0_mux out0 memory0_in0_mux:out0->memory0:in0 mul_in0_mux in0 in1 in2 mul_in0_mux out0 mul_in0_mux:out0->mul:in0 bfout0_branch->bf_in0_mux:in2 10 bfout0_branch->output_in0_mux:in1 5 bfout0_branch->memory1_in0_mux:in3 9 bfout0_branch->memory0_in0_mux:in3 8 memory1out0_branch->bf_in0_mux:in3 11 memory1out0_branch->bf_in1_mux:in3 9 memory1out0_branch->output_in0_mux:in0 5 memory1out0_branch->mul_in0_mux:in2 7 memory0out0_branch->bf_in0_mux:in0 9 memory0out0_branch->bf_in1_mux:in0 10 memory0out0_branch->output_in0_mux:in2 6 memory0out0_branch->mul_in0_mux:in0 8 mulout0_branch->bf_in0_mux:in1 2 mulout0_branch->bf_in1_mux:in2 5 mulout0_branch->memory1_in0_mux:in0 5 mulout0_branch->memory0_in0_mux:in0 5 inputout0_branch->bf_in1_mux:in1 8 inputout0_branch->memory1_in0_mux:in1 5 inputout0_branch->memory0_in0_mux:in1 3 bfout1_branch->memory1_in0_mux:in2 13 bfout1_branch->memory0_in0_mux:in2 17 bfout1_branch->mul_in0_mux:in1 2


Total running time of the script: (0 minutes 15.660 seconds)

Gallery generated by Sphinx-Gallery