-
Notifications
You must be signed in to change notification settings - Fork 0
/
params.yaml
74 lines (74 loc) · 2.6 KB
/
params.yaml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
# Tagging of metrics and verification aggregation to assist filtering experiment
# sweeps
tag: ""
# Global seed to make evaluation reproducible
seed: 12
# Number of calibration passes to be applied to the model before export
calibration_passes: 32
# Model configuration section
model:
# Number of attention heads
num_heads: 12
# Number of attention block "layers"
num_layers: 1
# Enables/disables bias on linear layers
bias: True
# Size of the input/output embedding dimension
emb_dim: 384
# Size of the MLP layer dimension
mlp_dim: 1536
# Length of the input sequence, i.e., context size
seq_len: 512
# Number of bits to use for quantized representation
bits: 2
# Type of normalization layer to use in the transformer blocks
# Options are: layer-norm, batch-norm and none
norm: none
# Type of attention mask to use
# Options are: none, causal or random
mask: none
# Type of positional encoding to use at the input
# Options are: none, sinusoidal, binary, learned
positional_encoding: binary
# Model to ONNX export hyperparameters
export:
# Version of the default ONNX opset
opset_version: 14
# Apply the constant-folding optimization
do_constant_folding: true
# FINN build configuration
build:
# Directory to store the build outputs
output_dir: build
# Run synthesis to generate a .dcp for the stitched-IP output product
stitched_ip_gen_dcp: False
# Target clock period, i.e., inverse of target frequency
synth_clk_period_ns: 10.0
# Board to target with the build
board: RFSoC2x2
# Target shell flow: 'vivado_zynq' or 'vitis_alveo'
shell_flow_type: vivado_zynq
# Path to folding configuration file
folding_config_file: folding.yaml
# Path to layer implementation style specialization config
specialize_layers_config_file: specialize_layers.json
# Force the implementation of standalone thresholds to be able to use RTL
# implementation of the MVU
standalone_thresholds: True
# Maximum bit-width of quantizers converted to multi-thresholds
max_multithreshold_bit_width: 16
# Maximum width of MVAU stream per PE
mvau_wwidth_max: 2048
# FIFO nodes with depth larger than 32768 will be split
split_large_fifos: true
# # Optional: Start the build from a specific step
# start_step: "step_tidy_up_pre_attention"
# # Optional: Stop the build after a specific step
# stop_step: "step_hw_ipgen"
# Metrics aggregation configuration
metrics:
# Path to the report file to be summarized
# Note: remember to adjust the build directory when changing the config above
report: "build/report/post_synth_resources.json"
# Filter the report rows
filter: "(top)"