accelforge-0.0.1-py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- accelforge/__init__.py +21 -0
- accelforge/_accelerated_imports.py +16 -0
- accelforge/_deprecate/_simanneal/evalmapping.py +271 -0
- accelforge/_deprecate/_simanneal/mapspaceglobals.py +298 -0
- accelforge/_deprecate/_simanneal/simanneal.py +666 -0
- accelforge/_deprecate/_simanneal/tracking.py +105 -0
- accelforge/_deprecate/_simanneal/wrappers.py +218 -0
- accelforge/_deprecate/_simanneal2/__init__.py +7 -0
- accelforge/_deprecate/_simanneal2/simanneal.py +493 -0
- accelforge/_deprecate/_simanneal2/tracking.py +116 -0
- accelforge/_deprecate/compatibility_util.py +181 -0
- accelforge/_deprecate/layerdeduplication/__init__.py +2 -0
- accelforge/_deprecate/layerdeduplication/group_similar_einsums.py +160 -0
- accelforge/_deprecate/layerdeduplication/grouped_einsums.py +84 -0
- accelforge/_deprecate/mapping_filter_tags/__init__.py +2 -0
- accelforge/_deprecate/mapping_filter_tags/ffmt.py +212 -0
- accelforge/_deprecate/mapping_filter_tags/onesplit.py +24 -0
- accelforge/_deprecate/mapping_filter_tags/util.py +24 -0
- accelforge/_deprecate/tags.py +69 -0
- accelforge/_deprecate/viz/__init__.py +0 -0
- accelforge/_deprecate/viz/interactive.py +159 -0
- accelforge/_deprecate/viz/reservationtree.py +307 -0
- accelforge/_deprecate/viz/ski_slope.py +88 -0
- accelforge/_version.py +15 -0
- accelforge/examples.py +39 -0
- accelforge/frontend/__init__.py +10 -0
- accelforge/frontend/_binding.py +129 -0
- accelforge/frontend/_workload_isl/__init__.py +2 -0
- accelforge/frontend/_workload_isl/_isl.py +149 -0
- accelforge/frontend/_workload_isl/_symbolic.py +141 -0
- accelforge/frontend/arch copy.py +1544 -0
- accelforge/frontend/arch.py +1642 -0
- accelforge/frontend/config.py +63 -0
- accelforge/frontend/mapper/__init__.py +5 -0
- accelforge/frontend/mapper/ffm.py +126 -0
- accelforge/frontend/mapper/mapper.py +7 -0
- accelforge/frontend/mapper/metrics.py +30 -0
- accelforge/frontend/mapping/__init__.py +1 -0
- accelforge/frontend/mapping/mapping.py +1736 -0
- accelforge/frontend/model.py +14 -0
- accelforge/frontend/renames.py +150 -0
- accelforge/frontend/spec copy.py +230 -0
- accelforge/frontend/spec.py +301 -0
- accelforge/frontend/variables.py +12 -0
- accelforge/frontend/workload.py +952 -0
- accelforge/mapper/FFM/__init__.py +9 -0
- accelforge/mapper/FFM/_join_pmappings/__init__.py +0 -0
- accelforge/mapper/FFM/_join_pmappings/compatibility.py +653 -0
- accelforge/mapper/FFM/_join_pmappings/compress_pmappings.py +140 -0
- accelforge/mapper/FFM/_join_pmappings/join_pmappings.py +703 -0
- accelforge/mapper/FFM/_join_pmappings/pmapping_dataframe.py +901 -0
- accelforge/mapper/FFM/_join_pmappings/pmapping_group.py +337 -0
- accelforge/mapper/FFM/_make_pmappings/contraints/__init__.py +0 -0
- accelforge/mapper/FFM/_make_pmappings/contraints/constraints.py +360 -0
- accelforge/mapper/FFM/_make_pmappings/make_pmapping_templates/__init__.py +1 -0
- accelforge/mapper/FFM/_make_pmappings/make_pmapping_templates/make_loops.py +373 -0
- accelforge/mapper/FFM/_make_pmappings/make_pmapping_templates/make_pmapping_templates.py +463 -0
- accelforge/mapper/FFM/_make_pmappings/make_pmapping_templates/make_reservations.py +95 -0
- accelforge/mapper/FFM/_make_pmappings/make_pmapping_templates/make_storage_order.py +382 -0
- accelforge/mapper/FFM/_make_pmappings/make_pmapping_templates/make_storages.py +155 -0
- accelforge/mapper/FFM/_make_pmappings/make_pmappings.py +411 -0
- accelforge/mapper/FFM/_make_pmappings/make_pmappings_from_templates/__init__.py +1 -0
- accelforge/mapper/FFM/_make_pmappings/make_pmappings_from_templates/make_pmappings_from_templates.py +407 -0
- accelforge/mapper/FFM/_make_pmappings/make_pmappings_from_templates/make_tile_shapes.py +1681 -0
- accelforge/mapper/FFM/_make_pmappings/make_pmappings_from_templates/run_model.py +170 -0
- accelforge/mapper/FFM/_make_pmappings/make_pmappings_from_templates/symbol_relations.py +174 -0
- accelforge/mapper/FFM/_make_pmappings/pmapper_job.py +282 -0
- accelforge/mapper/FFM/_pareto_df/df_convention.py +273 -0
- accelforge/mapper/FFM/_pareto_df/pareto copy.py +836 -0
- accelforge/mapper/FFM/_pareto_df/pareto.py +508 -0
- accelforge/mapper/FFM/data.py +61 -0
- accelforge/mapper/FFM/main copy.py +236 -0
- accelforge/mapper/FFM/main.py +208 -0
- accelforge/mapper/FFM/mappings.py +510 -0
- accelforge/mapper/FFM/pmappings.py +310 -0
- accelforge/mapper/__init__.py +4 -0
- accelforge/mapper.py +0 -0
- accelforge/model/__init__.py +1 -0
- accelforge/model/_looptree/__init__.py +0 -0
- accelforge/model/_looptree/accesses.py +335 -0
- accelforge/model/_looptree/capacity/__init__.py +1 -0
- accelforge/model/_looptree/capacity/aggregators.py +36 -0
- accelforge/model/_looptree/capacity/capacity.py +47 -0
- accelforge/model/_looptree/energy.py +150 -0
- accelforge/model/_looptree/equivalent_ranks.py +29 -0
- accelforge/model/_looptree/latency/__init__.py +1 -0
- accelforge/model/_looptree/latency/latency.py +98 -0
- accelforge/model/_looptree/latency/memory.py +120 -0
- accelforge/model/_looptree/latency/processors.py +92 -0
- accelforge/model/_looptree/mapping_utilities.py +71 -0
- accelforge/model/_looptree/reuse/__init__.py +4 -0
- accelforge/model/_looptree/reuse/isl/__init__.py +1 -0
- accelforge/model/_looptree/reuse/isl/des.py +59 -0
- accelforge/model/_looptree/reuse/isl/isl_functions.py +374 -0
- accelforge/model/_looptree/reuse/isl/mapping_to_isl/__init__.py +4 -0
- accelforge/model/_looptree/reuse/isl/mapping_to_isl/analyze_mapping.py +297 -0
- accelforge/model/_looptree/reuse/isl/mapping_to_isl/skews_from_mapping.py +236 -0
- accelforge/model/_looptree/reuse/isl/mapping_to_isl/tiling.py +685 -0
- accelforge/model/_looptree/reuse/isl/mapping_to_isl/types.py +188 -0
- accelforge/model/_looptree/reuse/isl/spatial.py +260 -0
- accelforge/model/_looptree/reuse/isl/temporal.py +182 -0
- accelforge/model/_looptree/reuse/symbolic/__init__.py +1 -0
- accelforge/model/_looptree/reuse/symbolic/symbolic copy 2.py +1346 -0
- accelforge/model/_looptree/reuse/symbolic/symbolic copy.py +1408 -0
- accelforge/model/_looptree/reuse/symbolic/symbolic.py +1396 -0
- accelforge/model/_looptree/run.py +122 -0
- accelforge/model/_looptree/types.py +26 -0
- accelforge/model/_looptree/visualization/__init__.py +0 -0
- accelforge/model/_looptree/visualization/occupancy.py +11 -0
- accelforge/model/main.py +222 -0
- accelforge/plotting/__init__.py +2 -0
- accelforge/plotting/mappings.py +219 -0
- accelforge/plotting/specs.py +57 -0
- accelforge/util/__init__.py +4 -0
- accelforge/util/_base_analysis_types.py +24 -0
- accelforge/util/_basetypes.py +1089 -0
- accelforge/util/_frozenset.py +36 -0
- accelforge/util/_isl.py +29 -0
- accelforge/util/_itertools.py +14 -0
- accelforge/util/_mathfuncs.py +57 -0
- accelforge/util/_parse_expressions.py +339 -0
- accelforge/util/_picklecache.py +32 -0
- accelforge/util/_setexpressions.py +268 -0
- accelforge/util/_sympy/__init__.py +0 -0
- accelforge/util/_sympy/broadcast_max.py +18 -0
- accelforge/util/_visualization.py +112 -0
- accelforge/util/_yaml.py +579 -0
- accelforge/util/parallel.py +193 -0
- accelforge-0.0.1.dist-info/METADATA +64 -0
- accelforge-0.0.1.dist-info/RECORD +258 -0
- accelforge-0.0.1.dist-info/WHEEL +5 -0
- accelforge-0.0.1.dist-info/licenses/LICENSE +19 -0
- accelforge-0.0.1.dist-info/top_level.txt +5 -0
- docs/_build/html/_sources/fastfusion.frontend.mapper.rst.txt +37 -0
- docs/_build/html/_sources/fastfusion.frontend.rst.txt +70 -0
- docs/_build/html/_sources/fastfusion.frontend.workload.rst.txt +21 -0
- docs/_build/html/_sources/fastfusion.mapper.FFM.rst.txt +37 -0
- docs/_build/html/_sources/fastfusion.mapper.rst.txt +18 -0
- docs/_build/html/_sources/fastfusion.rst.txt +20 -0
- docs/_build/html/_sources/fastfusion.util.rst.txt +21 -0
- docs/_build/html/_sources/index.rst.txt +87 -0
- docs/_build/html/_sources/modules.rst.txt +7 -0
- docs/_build/html/_sources/notes/citation.rst.txt +45 -0
- docs/_build/html/_sources/notes/definitions.rst.txt +43 -0
- docs/_build/html/_sources/notes/faqs.rst.txt +39 -0
- docs/_build/html/_sources/notes/modeling/accelerator_energy_latency.rst.txt +72 -0
- docs/_build/html/_sources/notes/modeling/component_energy_area.rst.txt +96 -0
- docs/_build/html/_sources/notes/modeling/mapping.rst.txt +100 -0
- docs/_build/html/_sources/notes/modeling.rst.txt +33 -0
- docs/_build/html/_sources/notes/parsing/arithmetic_parsing.rst.txt +136 -0
- docs/_build/html/_sources/notes/parsing/setexpressions.rst.txt +63 -0
- docs/_build/html/_sources/notes/parsing/yaml_parsing.rst.txt +176 -0
- docs/_build/html/_sources/notes/quickstart_and_installation.rst.txt +9 -0
- docs/_build/html/_sources/notes/spec/architecture.rst.txt +133 -0
- docs/_build/html/_sources/notes/spec/mapping.rst.txt +12 -0
- docs/_build/html/_sources/notes/spec/workload.rst.txt +83 -0
- docs/_build/html/_sources/notes/spec.rst.txt +36 -0
- docs/source/_ext/include_attrs.py +213 -0
- docs/source/_ext/include_docstring.py +364 -0
- docs/source/_ext/include_functions.py +154 -0
- docs/source/_ext/include_notebook.py +131 -0
- docs/source/_ext/include_yaml.py +119 -0
- docs/source/_ext/inherited_attributes.py +222 -0
- docs/source/_ext/paths.py +4 -0
- docs/source/conf.py +79 -0
- examples/arches/compute_in_memory/_include.yaml +74 -0
- examples/arches/compute_in_memory/_include_functions.py +229 -0
- examples/arches/compute_in_memory/_load_spec.py +57 -0
- examples/arches/compute_in_memory/components/c2c_multiplier.py +181 -0
- examples/arches/compute_in_memory/components/dac_c2c_r2r.py +605 -0
- examples/arches/compute_in_memory/components/misc.py +195 -0
- examples/arches/compute_in_memory/components/util/bit_functions.py +51 -0
- examples/arches/compute_in_memory/components/zero_comparator.py +92 -0
- examples/arches/compute_in_memory/isaac.yaml +233 -0
- examples/arches/compute_in_memory/memory_cells/ecram_demo.yaml +63 -0
- examples/arches/compute_in_memory/memory_cells/rram_example.yaml +63 -0
- examples/arches/compute_in_memory/memory_cells/rram_isaac_isca_2016.yaml +64 -0
- examples/arches/compute_in_memory/memory_cells/rram_neurosim_default.yaml +63 -0
- examples/arches/compute_in_memory/memory_cells/rram_raella_isca_2023.yaml +70 -0
- examples/arches/compute_in_memory/memory_cells/rram_wan_nature_2022.yaml +63 -0
- examples/arches/compute_in_memory/memory_cells/sram_colonnade_jssc_2021.yaml +63 -0
- examples/arches/compute_in_memory/memory_cells/sram_example.yaml +63 -0
- examples/arches/compute_in_memory/memory_cells/sram_jia_jssc_2020.yaml +63 -0
- examples/arches/compute_in_memory/memory_cells/sram_sinangil_jssc_2021.yaml +63 -0
- examples/arches/compute_in_memory/memory_cells/sram_wang_vlsi_2022.yaml +63 -0
- examples/arches/compute_in_memory/wang_vlsi_2022.yaml +289 -0
- examples/arches/eyeriss.yaml +68 -0
- examples/arches/fanout_variations/at_glb.yaml +31 -0
- examples/arches/fanout_variations/at_glb_with_fanout_node.yaml +34 -0
- examples/arches/fanout_variations/at_mac.yaml +31 -0
- examples/arches/fanout_variations/at_mac_with_constraints.yaml +38 -0
- examples/arches/fanout_variations/at_mac_with_fanout_node.yaml +34 -0
- examples/arches/nvdla.yaml +47 -0
- examples/arches/simple.yaml +28 -0
- examples/arches/tpu_v4i.yaml +67 -0
- examples/mappings/unfused_matmuls_to_simple.yaml +33 -0
- examples/misc/component_annotated.yaml +33 -0
- examples/workloads/gpt3_6.7B.yaml +124 -0
- examples/workloads/matmuls.yaml +20 -0
- examples/workloads/mobilenet_28.yaml +81 -0
- examples/workloads/mobilenet_various_separate.yaml +106 -0
- examples/workloads/three_matmuls_annotated.yaml +59 -0
- notebooks/.ipynb_checkpoints/fastfusion_arch_study_michael-checkpoint.ipynb +359 -0
- notebooks/compute_in_memory/_scripts.py +339 -0
- notebooks/compute_in_memory/isaac.guide.ipynb +270 -0
- notebooks/compute_in_memory/wang_vlsi_2022.ipynb +602 -0
- notebooks/paths.py +4 -0
- notebooks/tutorials/.ipynb_checkpoints/1_FFM-checkpoint.ipynb +3110 -0
- notebooks/tutorials/FFM.ipynb +3498 -0
- notebooks/tutorials/_include.py +48 -0
- notebooks/tutorials/component_energy_area.ipynb +363 -0
- tests/Q_mapping.yaml +38 -0
- tests/__init__.py +0 -0
- tests/conv.mapping.yaml +27 -0
- tests/conv.workload.yaml +13 -0
- tests/conv_sym.mapping.yaml +43 -0
- tests/copy.mapping.yaml +35 -0
- tests/copy.workload.yaml +15 -0
- tests/distribuffers/__init__.py +0 -0
- tests/distribuffers/multicast/test_cases.yaml +482 -0
- tests/distribuffers/spec/binding/valid_bindings.yaml +97 -0
- tests/distribuffers/spec/distributed.yaml +100 -0
- tests/distribuffers/spec/logical_arch.yaml +32 -0
- tests/distribuffers/spec/physical_arch.yaml +69 -0
- tests/distribuffers/test_binding.py +48 -0
- tests/frontend/__init__.py +0 -0
- tests/frontend/test_mapping_viz.py +52 -0
- tests/mapper/__init__.py +0 -0
- tests/mapper/configs/conv1d/conv1d.mapping.yaml +31 -0
- tests/mapper/configs/conv1d/conv1d.workload.yaml +11 -0
- tests/mapper/configs/two_conv1d/two_conv1d.expected.yaml +38 -0
- tests/mapper/configs/two_conv1d/two_conv1d.mapping.yaml +54 -0
- tests/mapper/configs/two_conv1d/two_conv1d.workload.yaml +19 -0
- tests/mapper/test_mapping_to_isl.py +90 -0
- tests/mapper/test_spatial_reuse_analysis.py +67 -0
- tests/mapper/test_temporal_reuse_analysis.py +56 -0
- tests/mapper/util.py +58 -0
- tests/matmul.mapping.yaml +29 -0
- tests/matmul.workload.yaml +12 -0
- tests/matmul_spatial.mapping.yaml +44 -0
- tests/mha.renames.yaml +65 -0
- tests/mha.workload.yaml +67 -0
- tests/mha.yaml +59 -0
- tests/mha_full.workload.yaml +67 -0
- tests/mobilenet.workload.yaml +35 -0
- tests/mobilenet_long.workload.yaml +64 -0
- tests/pmappingcache.py +24 -0
- tests/processing_stage.arch.yaml +40 -0
- tests/snowcat.arch.yaml +36 -0
- tests/test_ffm_join_pmappings.py +106 -0
- tests/test_ffm_make_pmappings.py +82 -0
- tests/test_ffm_make_tile_shapes.py +49 -0
- tests/test_mapper.py +100 -0
- tests/test_model.py +37 -0
- tests/test_plotting.py +72 -0
- tests/test_processing_stage.py +46 -0
- tests/test_symbolic_model.py +248 -0
- tests/test_workload.py +141 -0

examples/mappings/unfused_matmuls_to_simple.yaml
@@ -0,0 +1,33 @@
+mapping:
+  nodes:
+  {% for i in range(N_EINSUMS+1) %}
+  - !Storage
+    tensors: [T{{i}}]
+    component: MainMemory
+  {% endfor %}
+  {% for i in range(N_EINSUMS) %}
+  - !Storage
+    tensors: [W{{i}}]
+    component: MainMemory
+  {% endfor %}
+  - !Temporal
+    rank_variable: m
+    tile_shape: 1
+  - !Sequential
+    nodes:
+    {% for i in range(N_EINSUMS) %}
+    - !Nested
+      nodes:
+      - !Storage
+        tensors: [T{{i}}, W{{i}}, T{{i+1}}]
+        component: GlobalBuffer
+      - !Temporal
+        rank_variable: n{{i}}
+        tile_shape: 1
+      - !Temporal
+        rank_variable: n{{i+1}}
+        tile_shape: 1
+      - !Compute
+        einsum: Matmul{{i}}
+        component: MAC
+    {% endfor %}
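
Note: the file above is a Jinja2 template; N_EINSUMS is supplied at render time. As a sketch, rendering with N_EINSUMS=1 (our own expansion, not a file in the package) yields:

mapping:
  nodes:
  - !Storage            # backing storage for each intermediate tensor T0, T1
    tensors: [T0]
    component: MainMemory
  - !Storage
    tensors: [T1]
    component: MainMemory
  - !Storage            # backing storage for the weight tensor W0
    tensors: [W0]
    component: MainMemory
  - !Temporal           # iterate rank variable m one element at a time
    rank_variable: m
    tile_shape: 1
  - !Sequential
    nodes:
    - !Nested
      nodes:
      - !Storage        # tiles of all three operands held in the GlobalBuffer
        tensors: [T0, W0, T1]
        component: GlobalBuffer
      - !Temporal
        rank_variable: n0
        tile_shape: 1
      - !Temporal
        rank_variable: n1
        tile_shape: 1
      - !Compute        # innermost node issues Matmul0 on the MAC component
        einsum: Matmul0
        component: MAC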

examples/misc/component_annotated.yaml
@@ -0,0 +1,33 @@
+# The YAML tag at the beginning of the component tells the parser what type of
+# component it is.
+!Memory
+
+name: GlobalBuffer
+
+# This component_class invokes the hwcomponents_library.SmartBufferSRAM model. The
+# component is an SRAM buffer with an address register that is updated on every
+# access to queue up the next data.
+component_class: SmartBufferSRAM
+
+# Fields can be parsed as expressions. The size field is given in bits, and we write
+# here that it is 512 × 32 bits.
+size: 512 * 32
+
+# Sometimes, hwcomponents models require additional attributes that are not part of
+# the accelforge spec. These can be passed to the component models through the
+# extra_attributes_for_component_model field.
+extra_attributes_for_component_model:
+  depth: 512
+  width: size // depth
+  n_banks: 32
+  tech_node: 65e-9
+
+# Actions that the hwcomponents_library model must support. All applicable action
+# attributes are passed to the model's corresponding method (here, `read` or `write`).
+# The `bits_per_action` argument is special because it determines how many bits are
+# transferred by each read or write. Additionally, to pass extra attributes to the
+# component model as arguments, actions also have an
+# extra_attributes_for_component_model field.
+actions:
+- {name: read, bits_per_action: 64}
+- {name: write, bits_per_action: 64}
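
Note: because fields are parsed as expressions, the numeric attributes above can be evaluated directly. A quick evaluation (our own arithmetic, not part of the file):

size: 512 * 32         # evaluates to 16384 bits total
extra_attributes_for_component_model:
  depth: 512           # rows
  width: size // depth # evaluates to 16384 // 512 = 32 bits per row

With bits_per_action: 64 and a 32-bit row width, each read or write action as configured here moves two rows' worth of data.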

examples/workloads/gpt3_6.7B.yaml
@@ -0,0 +1,124 @@
+# Each tensor is shaped by a set of ranks, denoted by capital letters.
+# For example: Q is shaped by (B, M, H, E).
+# We'll use lower-case letters to index into the ranks.
+# For example: Q[b, m, h, e] is the tensor Q at index (b, m, h, e).
+
+# When making a projection list, it's equivalent to the Einsum subscript notation, so:
+# Q projection [b, m, h, e] means that b indexes into B, m indexes into M...
+# When making a projection dict, it's equivalent to the Einsum subscript/superscript notation, so:
+# K projection { B: b, M: p, H: h, E: e } means that b indexes into B, p indexes into M...
+
+# Renames take a tensor name and turn it into a canonical name that we can use in
+# architecture constraints. For example, we want to use the words "input", "weight", and
+# "output" to refer to the tensors of an Einsum, but the Einsum QK has no clear "weight"
+# or "input" because both Q and K are inputs. So we rename K to be the weight.
+
+
+workload:
+  rank_sizes:
+    {% set BATCH_SIZE = BATCH_SIZE | default(1) %}
+    {% set N_TOKENS = N_TOKENS | default(8192) %}
+    B: {{BATCH_SIZE}}
+    P: {{N_TOKENS}}
+    M: {{N_TOKENS}}
+    H: 32
+    E: 128
+    F: 128
+    D: 4096 # = e * h
+    C: 16384
+    J: 4096
+    G: 4096
+
+  bits_per_value: {All: 8}
+
+  einsums:
+  - name: I
+    # Copy operation means that we move the input tensor from one place to another
+    # without doing computation. This lets us copy the input tensor onto the accelerator
+    # once and then use it in the Q, K, and V operations.
+    is_copy_operation: True # no longer needed with `map` and `reduce` support
+    tensor_accesses:
+    - {name: I_in, projection: [b, m, d]}
+    - {name: I, projection: [b, m, d], output: True}
+
+    # operations:
+    #   map: {operation} if output = f(inputs), None if output = inputs
+    #   reduce: {operation} if output = reduce(partial_outputA, partial_outputB, ...), None if not supported
+    #   populate: {operation} if initial_output = populate, None if initial_output = first-generated partial output
+
+    # operations:
+    #   map: None # Alternatives: "mul", "relu", etc.
+    #   reduce: None # Alternatives: "max", etc. Note: None means "give me whatever is the last value (mapping dependent)"
+    #   # reduce: None with strict checking: if there is a reduce, an error is thrown.
+    #   populate: None
+    renames: {weight: Nothing, input: Inputs, output: Outputs}
+
+  - name: V
+    tensor_accesses:
+    - {name: I, projection: [b, m, d]}
+    - {name: WV, projection: [h, e, d], persistent: True}
+    - {name: V, projection: [b, m, h, e], output: True}
+
+  - name: K
+    tensor_accesses:
+    - {name: I, projection: [b, m, d]}
+    - {name: WK, projection: [h, e, d], persistent: True}
+    - {name: K, projection: [b, m, h, e], output: True}
+
+  - name: Q
+    tensor_accesses:
+    - {name: I, projection: [b, m, d]}
+    - {name: WQ, projection: [h, e, d], persistent: True}
+    - {name: Q, projection: [b, m, h, e], output: True}
+
+  - name: QK
+    tensor_accesses:
+    - {name: Q, projection: [b, m, h, e]}
+    - {name: K, projection: { B: b, M: p, H: h, E: e }}
+    - {name: QK, projection: [b, m, p, h], output: True}
+    renames: {weight: K, input: Q, output: QK}
+
+  - name: QK_softmax
+    tensor_accesses:
+    - {name: QK, projection: [b, m, p, h]}
+    - {name: QK_softmax, projection: [b, m, p, h], output: True}
+    renames: {weight: Nothing}
+
+  - name: AV
+    tensor_accesses:
+    - {name: QK_softmax, projection: [b, m, p, h]}
+    - {name: V, projection: { B: b, M: p, H: h, E: f }}
+    - {name: AV, projection: [b, m, h, f], output: True}
+    renames: {weight: V, input: QK_softmax}
+
+  - name: Z
+    tensor_accesses:
+    - {name: AV, projection: [b, m, h, f]}
+    - {name: WZ, projection: [h, f, g], persistent: True}
+    - {name: Z, projection: [b, m, g], output: True}
+
+  - name: FFA
+    tensor_accesses:
+    - {name: Z, projection: [b, m, g]}
+    - {name: WFFA, projection: [g, c], persistent: True}
+    - {name: FFA, projection: [b, m, c], output: True}
+
+  - name: FFB
+    tensor_accesses:
+    - {name: FFA, projection: [b, m, c]}
+    - {name: WFFB, projection: [c, j], persistent: True}
+    - {name: FFB, projection: [b, m, j], output: True}
+
+renames:
+  einsums:
+  - name: default
+    tensor_accesses:
+    - name: input
+      source: Inputs & Intermediates
+      expected_count: 1
+    - name: output
+      source: Outputs
+      expected_count: 1
+    - name: weight
+      source: ~(input | output)
+      expected_count: 1
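
Note: to make the list/dict projection equivalence described in the header comments concrete, the two accesses below are equivalent spellings of the same projection of Q (a sketch following the file's own convention, where list positions map to ranks in order):

- {name: Q, projection: [b, m, h, e]}              # list form: order follows (B, M, H, E)
- {name: Q, projection: {B: b, M: m, H: h, E: e}}  # dict form: ranks named explicitly

The dict form is what lets the QK Einsum index K with p in place of m (M: p), giving the second token axis of the attention matrix QK[b, m, p, h].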

examples/workloads/matmuls.yaml
@@ -0,0 +1,20 @@
+workload:
+  iteration_space_shape:
+    {% set M = M | default(128) %}
+    {% set KN = KN | default(128) %}
+    m: 0 <= m < {{M}}
+    {% for i in range(N_EINSUMS+1) %}
+    n{{i}}: 0 <= n{{i}} < {{KN}}
+    {% endfor %}
+
+  bits_per_value: {All: 8}
+
+  einsums:
+  {% for i in range(N_EINSUMS) %}
+  - name: Matmul{{i}}
+    tensor_accesses:
+    - {name: T{{i}}, projection: [m, n{{i}}]}
+    - {name: W{{i}}, projection: [n{{i}}, n{{i+1}}]}
+    - {name: T{{i+1}}, projection: [m, n{{i+1}}], output: True}
+    renames: {weight: W{{i}}, input: T{{i}}, output: T{{i+1}}}
+  {% endfor %}
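
Note: this workload template uses the same T{{i}}/W{{i}}/Matmul{{i}} names as the mapping template earlier in this diff, so the two render consistently for a given N_EINSUMS. As a sketch, N_EINSUMS=1 with the default sizes expands to (our own expansion, not a file in the package):

workload:
  iteration_space_shape:
    m: 0 <= m < 128
    n0: 0 <= n0 < 128
    n1: 0 <= n1 < 128

  bits_per_value: {All: 8}

  einsums:
  - name: Matmul0
    tensor_accesses:
    - {name: T0, projection: [m, n0]}
    - {name: W0, projection: [n0, n1]}
    - {name: T1, projection: [m, n1], output: True}
    renames: {weight: W0, input: T0, output: T1}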

examples/workloads/mobilenet_28.yaml
@@ -0,0 +1,81 @@
+workload:
+  rank_sizes:
+    {% set BATCH_SIZE = BATCH_SIZE | default(1) %}
+    B: {{BATCH_SIZE}}
+    P0: 28
+    Q0: 28
+    N0: 24
+    T0: 192
+    N1: 24
+    P1: 28
+    Q1: 28
+    P2: 28
+    Q2: 28
+    T1: 192
+    N2: 24
+
+  bits_per_value: {All: 8}
+
+  einsums:
+  - name: PiecewiseA0
+    tensor_accesses:
+    - {name: T0, projection: [p0, q0, n0, b]}
+    - {name: WA0, projection: [n0, t0]}
+    - {name: TA0, projection: [p0, q0, t0, b], output: True}
+    renames: {input: T0, output: TA0, weight: WA0}
+
+  - name: Depthwise0
+    tensor_accesses:
+    - name: TA0
+      projection:
+        P0: p1 + r0
+        Q0: q1 + s0
+        T0: t0
+        B: b
+    - {name: WAB0, projection: [r0, s0, t0]}
+    - {name: TB0, projection: [p1, q1, t0, b], output: True}
+    shape: [0 <= r0 < 3, 0 <= s0 < 3]
+
+  - name: PiecewiseB0
+    tensor_accesses:
+    - {name: TB0, projection: [p1, q1, t0, b]}
+    - {name: WB0, projection: [t0, n1]}
+    - {name: T1, projection: [p1, q1, n1, b], output: True}
+
+  - name: PiecewiseA1
+    tensor_accesses:
+    - {name: T1, projection: [p1, q1, n1, b]}
+    - {name: WA1, projection: [n1, t1]}
+    - {name: TA1, projection: [p1, q1, t1, b], output: True}
+
+  - name: Depthwise1
+    tensor_accesses:
+    - name: TA1
+      projection:
+        P1: p2 + r1
+        Q1: q2 + s1
+        T1: t1
+        B: b
+    - {name: WAB1, projection: [r1, s1, t1]}
+    - {name: TB1, projection: [p2, q2, t1, b], output: True}
+    shape: [1 <= r1 < 3, 1 <= s1 < 3]
+
+  - name: PiecewiseB2
+    tensor_accesses:
+    - {name: TB1, projection: [p2, q2, t1, b]}
+    - {name: WB1, projection: [t1, n2]}
+    - {name: T2, projection: [p2, q2, n2, b], output: True}
+
+renames:
+  einsums:
+  - name: default
+    tensor_accesses:
+    - name: input
+      source: Inputs & Intermediates
+      expected_count: 1
+    - name: output
+      source: Outputs
+      expected_count: 1
+    - name: weight
+      source: ~(input | output)
+      expected_count: 1
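
Note: the dict projections with affine index expressions (P0: p1 + r0, Q0: q1 + s0) encode a sliding window. Written out as an Einsum, Depthwise0 above is, assuming the usual multiply-accumulate semantics (our own rendering, not part of the file):

TB0[p1, q1, t0, b] += TA0[p1 + r0, q1 + s0, t0, b] * WAB0[r0, s0, t0]
    where 0 <= r0 < 3 and 0 <= s0 < 3   # the 3x3 window from the shape field

The shape field bounds the window ranks r0 and s0, which appear only in this Einsum and so are not listed under rank_sizes.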

examples/workloads/mobilenet_various_separate.yaml
@@ -0,0 +1,106 @@
+workload:
+  version: "0.5"
+  shape:
+    {% set BATCH_SIZE = BATCH_SIZE | default(1) %}
+    b: 0 <= b < {{BATCH_SIZE}}
+    pp0: 0 <= pp0 < 116
+    qp0: 0 <= qp0 < 116
+    cp0: 0 <= cp0 < 16
+    mp0: 0 <= mp0 < 16
+    pd0: 0 <= pd0 < 116
+    qd0: 0 <= qd0 < 116
+    cd0: 0 <= cd0 < 16
+    rd0: 0 <= rd0 < 3
+    sd0: 0 <= sd0 < 3
+
+    pp1: 0 <= pp1 < 56
+    qp1: 0 <= qp1 < 56
+    cp1: 0 <= cp1 < 24
+    mp1: 0 <= mp1 < 72
+    pd1: 0 <= pd1 < 56
+    qd1: 0 <= qd1 < 56
+    cd1: 0 <= cd1 < 72
+    rd1: 0 <= rd1 < 5
+    sd1: 0 <= sd1 < 5
+
+    pp2: 0 <= pp2 < 28
+    qp2: 0 <= qp2 < 28
+    cp2: 0 <= cp2 < 40
+    mp2: 0 <= mp2 < 120
+    pd2: 0 <= pd2 < 28
+    qd2: 0 <= qd2 < 28
+    cd2: 0 <= cd2 < 120
+    rd2: 0 <= rd2 < 3
+    sd2: 0 <= sd2 < 3
+
+  einsums:
+  - name: P0
+    tensor_accesses:
+    - {name: IP0, projection: [pp0, qp0, cp0, b]}
+    - {name: WP0, projection: [cp0, mp0]}
+    - {name: OP0, projection: [pp0, qp0, mp0, b], output: True}
+    renames: {input: IP0, output: OP0, weight: WP0}
+
+  - name: D0
+    tensor_accesses:
+    - name: ID0
+      projection:
+        PD0: pd0 + rd0
+        QD0: qd0 + sd0
+        CD0: cd0
+        B: b
+    - {name: WD0, projection: [rd0, sd0, cd0]}
+    - {name: OD0, projection: [pd0, qd0, cd0, b], output: True}
+    renames: {input: ID0, output: OD0, weight: WD0}
+
+  - name: P1
+    tensor_accesses:
+    - {name: IP1, projection: [pp1, qp1, cp1, b]}
+    - {name: WP1, projection: [cp1, mp1]}
+    - {name: OP1, projection: [pp1, qp1, mp1, b], output: True}
+    renames: {input: IP1, output: OP1, weight: WP1}
+
+  - name: D1
+    tensor_accesses:
+    - name: ID1
+      projection:
+        PD1: pd1 + rd1
+        QD1: qd1 + sd1
+        CD1: cd1
+        B: b
+    - {name: WD1, projection: [rd1, sd1, cd1]}
+    - {name: OD1, projection: [pd1, qd1, cd1, b], output: True}
+    renames: {input: ID1, output: OD1, weight: WD1}
+
+  - name: P2
+    tensor_accesses:
+    - {name: IP2, projection: [pp2, qp2, cp2, b]}
+    - {name: WP2, projection: [cp2, mp2]}
+    - {name: OP2, projection: [pp2, qp2, mp2, b], output: True}
+    renames: {input: IP2, output: OP2, weight: WP2}
+
+  - name: D2
+    tensor_accesses:
+    - name: ID2
+      projection:
+        PD2: pd2 + rd2
+        QD2: qd2 + sd2
+        CD2: cd2
+        B: b
+    - {name: WD2, projection: [rd2, sd2, cd2]}
+    - {name: OD2, projection: [pd2, qd2, cd2, b], output: True}
+    renames: {input: ID2, output: OD2, weight: WD2}
+
+renames:
+  einsums:
+  - name: default
+    tensor_accesses:
+    - name: input
+      source: Inputs() & Intermediates()
+      expected_count: 1
+    - name: output
+      source: Outputs()
+      expected_count: 1
+    - name: weight
+      source: ~(input | output)
+      expected_count: 1

examples/workloads/three_matmuls_annotated.yaml
@@ -0,0 +1,59 @@
+workload:
+  # These rank sizes define the shapes of the tensors in the Einsums. Shapes are
+  # assumed to span [0, size-1]. Indices into a rank are omitted if out of range.
+  rank_sizes:
+    M: 128
+    N0: 128
+    N1: 128
+    N2: 128
+    N3: 128
+
+  # Alternatively, we can constrain each of the rank variables to be within a range.
+  # The values in this dictionary are ISL expressions, and the constraints apply to
+  # all Einsums that use these rank variables.
+  iteration_space_shape:
+    m: 0 <= m < 128
+    n0: 0 <= n0 < 128
+    n1: 0 <= n1 < 128
+    n2: 0 <= n2 < 128
+    n3: 0 <= n3 < 128
+
+  # Describes the number of bits in each value of each tensor. This is a dictionary
+  # mapping set expressions to bits per value for the tensors given by those
+  # expressions. These values can be overridden by the bits_per_value attribute of any tensor access.
+  bits_per_value: {All: 8}
+
+  # The Einsums in the workload.
+  einsums:
+  - name: Matmul1
+    tensor_accesses:
+    - {name: T0, projection: [m, n0]}
+    - {name: W0, projection: [n0, n1]}
+    - {name: T1, projection: [m, n1], output: True}
+    renames: {input: T0}
+
+  - name: Matmul2
+    tensor_accesses:
+    - {name: T1, projection: [m, n1]}
+    - {name: W1, projection: [n1, n2]}
+    - {name: T2, projection: [m, n2], output: True}
+
+  - name: Matmul3
+    tensor_accesses:
+    - {name: T2, projection: [m, n2]}
+    - {name: W2, projection: [n2, n3]}
+    - {name: T3, projection: [m, n3], output: True}
+
+renames:
+  einsums:
+  - name: default
+    tensor_accesses:
+    - name: input
+      source: Inputs & Intermediates
+      expected_count: 1
+    - name: output
+      source: Outputs
+      expected_count: 1
+    - name: weight
+      source: ~(input | output)
+      expected_count: 1
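
Note: applying the default rename rules to Matmul1 above shows how the canonical names resolve (our own working, not part of the file):

# Matmul1 accesses {T0, W0, T1}; T1 is marked output: True.
#   input  -> T0  (pinned explicitly by renames: {input: T0})
#   output -> T1  (source: Outputs matches the one output tensor)
#   weight -> W0  (source: ~(input | output) leaves only W0)

For Matmul2 and Matmul3, which give no per-Einsum renames, the default rules alone resolve all three names, and each source must match exactly one tensor (expected_count: 1).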