DependableSystemsLab · abrahamchan · Apr 10, 2026 · May 9, 2026 · Apr 10, 2026 · Apr 10, 2026
diff --git a/.clang-format b/.clang-format
@@ -0,0 +1,60 @@
+# clang-format configuration for LLTFI
+#
+# Based on LLVM style (K&R braces, 2-space indent, 80-col limit).
+# Run:  clang-format-20 -i <file.cpp>
+# Or:   lint.sh --fix  (reformats all C++ files in-place)
+
+---
+BasedOnStyle:  LLVM
+Language:      Cpp
+Standard:      c++17
+
+# Indentation
+IndentWidth:            2
+TabWidth:               2
+UseTab:                 Never
+ContinuationIndentWidth: 4
+IndentCaseLabels:       false
+IndentPPDirectives:     None
+
+# Line length
+ColumnLimit:  80
+
+# Line break
+LineEnding: LF
+
+# Braces — attach (K&R / LLVM style)
+BreakBeforeBraces: Attach
+
+# Includes
+SortIncludes:           CaseSensitive
+IncludeBlocks:          Regroup
+IncludeCategories:
+  # LLTFI local headers first
+  - Regex:    '^"(FI|Utils|Controller|Profil|Inst|Reg|Gen|LLFIDot)'
+    Priority: 1
+  # LLVM headers
+  - Regex:    '^"llvm/'
+    Priority: 2
+  # System headers
+  - Regex:    '^<'
+    Priority: 3
+
+# Pointer alignment: right (int *p, not int* p)
+PointerAlignment: Right
+
+# Function arguments
+AllowAllArgumentsOnNextLine:           true
+AllowAllParametersOfDeclarationOnNextLine: true
+BinPackArguments:  true
+BinPackParameters: true
+
+# Short constructs — LLVM defaults, except short functions (Inline, not All)
+AllowShortFunctionsOnASingleLine: Inline
+AllowShortIfStatementsOnASingleLine: Never
+AllowShortLoopsOnASingleLine: false
+
+# Misc
+SpaceBeforeParens:     ControlStatements
+SpacesInAngles:        Never
+SpacesInParentheses:   false
diff --git a/.clang-tidy b/.clang-tidy
@@ -0,0 +1,62 @@
+# clang-tidy configuration for LLTFI
+#
+# Run from the repo root (requires compile_commands.json in the build dir):
+#   clang-tidy-20 -p /path/to/LLTFI-build <file.cpp>
+# Or use lint.sh which handles discovery automatically.
+#
+# To generate compile_commands.json, add -DCMAKE_EXPORT_COMPILE_COMMANDS=ON
+# to the cmake invocation inside ./setup, or run:
+#   cd /path/to/LLTFI-build && cmake -DCMAKE_EXPORT_COMPILE_COMMANDS=ON .
+
+---
+Checks: >
+  bugprone-*,
+  clang-analyzer-core.*,
+  clang-analyzer-cplusplus.*,
+  clang-analyzer-deadcode.*,
+  clang-analyzer-security.*,
+  cppcoreguidelines-init-variables,
+  cppcoreguidelines-narrowing-conversions,
+  cppcoreguidelines-slicing,
+  llvm-namespace-comment,
+  llvm-twine-local,
+  modernize-use-nullptr,
+  modernize-use-override,
+  modernize-redundant-void-arg,
+  performance-for-range-copy,
+  performance-implicit-conversion-in-loop,
+  performance-unnecessary-copy-initialization,
+  readability-const-return-type,
+  readability-container-size-empty,
+  readability-delete-null-pointer,
+  readability-misplaced-array-index,
+  readability-redundant-declaration,
+  -bugprone-easily-swappable-parameters,
+  -bugprone-macro-parentheses,
+  -bugprone-branch-clone,
+  -bugprone-assignment-in-if-condition,
+  -clang-analyzer-optin.*,
+  -clang-analyzer-cplusplus.NewDelete,
+  -clang-diagnostic-macro-redefined,
+
+# Checks intentionally not enabled (they fire heavily on LLVM-pass idioms):
+#   cppcoreguidelines-pro-bounds-*   — pointer arithmetic is normal in LLVM IR
+#   cppcoreguidelines-pro-type-*     — reinterpret_cast used in IR manipulation
+#   cppcoreguidelines-avoid-magic-numbers — opcode numbers are intentional
+#   cppcoreguidelines-pro-type-vararg    — some C APIs use varargs
+#   modernize-use-trailing-return-type   — not in our style guide
+
+WarningsAsErrors: ''
+
+HeaderFilterRegex: 'llvm_passes/.*\.h$'
+
+CheckOptions:
+  # Enforce nullptr over NULL
+  - key:   modernize-use-nullptr.NullMacros
+    value: 'NULL'
+
+  # Namespace comment style: closing brace should say "// namespace llfi"
+  - key:   llvm-namespace-comment.ShortNamespaceLines
+    value: '10'
+  - key:   llvm-namespace-comment.SpacesBeforeComments
+    value: '2'
diff --git a/.editorconfig b/.editorconfig
@@ -0,0 +1,26 @@
+root = true
+
+[*]
+charset = utf-8
+end_of_line = lf
+insert_final_newline = true
+trim_trailing_whitespace = true
+
+[*.{cpp,h,c}]
+indent_style = space
+indent_size = 2
+
+[*.py]
+indent_style = space
+indent_size = 4
+
+[*.{yaml,yml}]
+indent_style = space
+indent_size = 2
+
+[CMakeLists.txt]
+indent_style = space
+indent_size = 2
+
+[Makefile]
+indent_style = tab
diff --git a/.gitignore b/.gitignore
@@ -6,17 +6,7 @@ config/java_paths.cmake
 config/java_paths.py
 tools/zgrviewer/llfi_run.sh
 
-# Same holds for the installer directory
-installer/downloads/*
-installer/llfi/*
-installer/llfisrc/*
-installer/llvm/*
-installer/llvmsrc/*
-installer/pyyaml/*
-installer/pyyamlsrc/*
-installer/fontconfig/*
 build/
-sample_programs/
 
 # All the .ll and .bc files
 *.ll
@@ -28,8 +18,9 @@ sample_programs/
 __pycache__/
 *.pyc
 
-# FIDL-generated software fault selector files (regenerated by setup via FIDL-Algorithm.py)
-llvm_passes/software_failures/_*_*Selector.cpp
+# protobuf build artifacts (downloaded during ML dependency setup)
+protobuf-*/
+protobuf-all-*.zip
 
 # gedit backup files
 *~
@@ -56,7 +47,3 @@ gui/sum/
 gui/min/
 gui/bfs/
 
-# web app
-web-app/node_modules/
-web-app/views/bundle.min.js
-web-app/server/uploads/*
diff --git a/CHANGELOG.md b/CHANGELOG.md
@@ -0,0 +1,160 @@
+# Changelog
+
+All notable changes to LLTFI are recorded here.
+Format follows [Keep a Changelog](https://keepachangelog.com/en/1.0.0/).
+
+---
+
+## [Unreleased] — LLVM 20 branch (`LLVM20`)
+
+This release upgrades LLTFI from LLVM 15 to LLVM 20.  Apart from the breaking
+changes listed below, every change is backward-compatible with LLFI.  The full
+migration narrative, task breakdown, and effort accounting are in `migration.md`.
+
+### Breaking changes
+
+- **LLVM version requirement raised from 15 to 20.**  LLVM 15 is no longer
+  supported.  Install LLVM 20 via the LLVM apt repository or build from source
+  (see `README.md`).
+- **Legacy pass manager (`opt -load`, `-enable-new-pm=0`) removed.**  All
+  passes — including `InstructionDuplication` — now use the new pass manager
+  exclusively.  Any external scripts calling `opt` directly must be updated to
+  use `-load-pass-plugin` and `--passes=<PassName>`.
+- **`InstructionDuplication` pass renamed** to `InstructionDuplicationPass` in
+  the plugin registry to match the new PM convention.
+
+---
+
+### Added
+
+#### New passes and tests
+- `InstructionDuplication` migrated to the new pass manager (`PassInfoMixin`);
+  exposed as `"InstructionDuplicationPass"` in `SEDPasses.so`.
+- Two new tests in `test_instruction_duplication.py`:
+  - `real_model_structural` — applies `InstructionDuplicationPass` to a real
+    onnx-mlir `model.ll` and verifies `compareFloatValues` calls are inserted.
+  - `real_model_end_to_end` — runs the baseline and duplicated models through
+    `lli` and asserts outputs are identical (SKIP when `model.ll` absent).
+
+#### Tooling
+- `lint.sh` — unified C++ and Python lint runner; `--fix` auto-formats in-place.
+- `.clang-tidy` — project-level tidy config with intentionally disabled checks
+  documented.
+- `.clang-format` — project-level format config (LLVM style, 2-space indent).
+- `setup.cfg` — `flake8` and `flake8-bugbear` configuration for Python linting.
+
+#### Documentation
+- `architecture.md` — new developer reference covering pass pipeline, selector
+  class hierarchy, hardware/software/ML fault modes, the runtime library, and
+  the interface between compile-time and runtime layers.
+- `docs/input_yaml_guide.md` — prose guide to writing `input.yaml` files,
+  covering all keys, `CustomTensorOperator` ML targeting, and complete examples.
+- `docs/tutorial_first_experiment.md` — end-to-end walkthrough of the
+  `factorial` experiment including output file interpretation and outcome
+  classification (masked / SDC / crash / hang).
+- `docs/adding_a_test.md` — step-by-step guide for adding a regression test,
+  covering program registration, test case structure, custom Python scripts,
+  and the SKIP convention.
+- `CODING_GUIDELINES.md` — expanded with sections on `override`, variable
+  initialisation, container emptiness (`.empty()` over `.size() == 0`), and
+  `cast<>` vs. `dyn_cast<>`.
+- `CONTRIBUTING.md` — added `Adding a Test Case` section pointing to
+  `docs/adding_a_test.md`.
+- `docs/tutorial_ml_experiment.md` — new end-to-end walkthrough of an ML/ONNX
+  fault injection experiment covering the full ONNX → LLVM IR compilation
+  pipeline, `CustomTensorOperator` layer targeting, multi-fault injection
+  options, per-layer profiling output, and `CompareLayerOutputs.py`.
+
+---
+
+### Changed
+
+#### LLVM 20 API compatibility
+
+| File | Change |
+|------|--------|
+| `llvm_passes/core/FaultInjectionPass.cpp` | 3 sites: `new AllocaInst/StoreInst/LoadInst` constructors updated to LLVM 17+ API |
+| `llvm_passes/core/InstTracePass.cpp` | 6 sites: same; `getFirstNonPHIOrDbgOrLifetime()` now returns `BasicBlock::iterator` |
+| `llvm_passes/core/Utils.cpp` | `M.getGlobalList().push_back()` → `new GlobalVariable(M, ...)` (removed in LLVM 17) |
+| All selector `.cpp` files | `getNumArgOperands()` → `arg_size()` (removed in LLVM 15); `#include "llvm/Support/CFG.h"` → `"llvm/IR/CFG.h"` |
+| `llvm_passes/instruction_duplication/InstructionDuplication.cpp` | `getNextNonDebugInstruction()` return type updated to `BasicBlock::iterator` |
+
+#### Code quality (C++ — found by clang-tidy and code review)
+
+| Category | Details |
+|----------|---------|
+| Bug fixes | Double-free in `Controller.cpp` destructor; file stream leak in `LLFIDotGraphPass.cpp`; unchecked `fopen` null in `GenLLFIIndexPass.cpp`; uninitialized `isChainDuplication` field |
+| Null safety | `getCalledFunction()` null checks in `ProfilingPass.cpp`, `InstructionDuplication.cpp`, `CustomTensorOperatorInstSelector.cpp` |
+| LLVM idioms | `dyn_cast<>` after `isa<>` → `cast<>` (asserting) across `Utils.cpp`, `ProfilingPass.cpp`; `NULL` → `nullptr` throughout |
+| Override safety | `virtual` on override methods → `override` keyword across all selector classes; `virtual ~Base() = default` added to abstract base classes |
+| Style | `.empty()` over `.size() == 0`; `const auto&` in range-for; `strncpy`/`strncat` over unbounded `strcpy`/`strcat`; `cl::opt<T>::getValue()` to avoid slicing |
+| Dead code | Removed unreachable `return false` after exhaustive if/else in `InstructionDuplication.cpp:runOnMainGraph()` |
+| Copies | `for (auto insVector : arithInst)` → `for (const auto& insVector : ...)` to avoid copying inner vectors |
+
+#### Code quality (Python — found by flake8/bugbear)
+
+- `except:` → `except Exception:` throughout `bin/`, `tools/`, `test_suite/SCRIPTS/`
+- Bare `open()` → `with open(...) as f:` in multiple scripts
+- `subprocess` calls using `shell=True` removed; replaced with list-form calls
+- `yaml.load()` → `yaml.safe_load()` everywhere
+- `exit()` → `sys.exit()` in scripts
+- `%-format` strings → f-strings in new code
+
+#### Docker
+
+- `docker/Dockerfile` — LLVM source checkout updated from a pinned LLVM 15
+  commit hash (`9778ec057cf4`) to the `llvmorg-20.1.0` tag; `pyyaml===5.4.1`
+  corrected to `pyyaml==5.4.1` (`===` is PEP 440 arbitrary equality, not a normal version pin).
+
+#### Documentation updates
+
+- `README.md` — restructured to eliminate overlap with `architecture.md`;
+  added `docs/` section listing all user guides; added pointer to
+  `architecture.md` for internal design.
+- `caveats.txt` — LLVM version references updated 15 → 20; duplicate item
+  number fixed.
+- `llvm_passes/instruction_duplication/README.md` — `opt -always-inline`
+  (legacy PM) → `opt --passes=always-inline` (new PM).
+- `llvm_passes/instruction_duplication/shared_lib/build.sh` and
+  `compile_shrd_lib.sh` — hardcoded `clang`/`clang++` → `LLVM_GXX_BIN_DIR`
+  pattern, fixing builds on Ubuntu where apt installs `clang-20` only.
+- `architecture.md` — corrected several inaccuracies found during code review:
+  `preFunc` return type (`bool` not `int`) and parameter types (`unsigned`
+  throughout); `injectFunc` register parameter types; `doProfiling` parameter
+  type (`int` not `unsigned`); `printInstTracer` signature (second param is
+  `char *opcode`, not `unsigned`; last param is `int`, not `long`);
+  `lltfiMLLayer` parameter types (`int64_t`); removed non-existent `random`
+  and `data_corruption` `fi_type` entries; corrected one further claim (TODO: this entry is cut off — restore the missing text).
+
+---
+
+### Pending before merge (human tasks)
+
+- **H-2** — Human review of IRBuilder insertion-point correctness in
+  `FaultInjectionPass.cpp` and `InstTracePass.cpp`.  The `AllocaInst` calls
+  were migrated to `BasicBlock*` insertAtEnd form and `BasicBlock::iterator`
+  form respectively; both compile and all 21 tests pass, but a developer
+  familiar with the pass semantics should verify the insertion points are
+  logically correct before merging to main.
+- **H-3** — onnx-mlir real-model validation.  Requires installing onnx-mlir and
+  running `sample_programs/ml_sample_programs/vision_models/mnist/compile.sh`
+  to produce `model.ll`.  The two new `test_instruction_duplication.py` tests
+  will then run instead of skipping.  Not a blocker — all other tests pass.
+
+---
+
+## [Previous] — LLVM 15 baseline (`master`)
+
+The `master` branch represents LLTFI as it existed targeting LLVM 15, with
+the following improvements over the original LLFI fork:
+
+- ML fault injection support (TensorFlow, PyTorch via ONNX-MLIR)
+- `CustomTensorOperator` instruction selector for layer-level ML targeting
+- `InstructionDuplication` pass (`SEDPasses.so`) for soft-error detection
+- Batch fault injection scripts (`batchInstrument.py`, `batchProfile.py`,
+  `batchInjectfault.py`)
+- Trace analysis tools (`tracediff.py`, `traceontograph.py`, `traceunion.py`,
+  `tracetodot.py`)
+- Makefile generation tool (`GenerateMakefile`)
+- Initial `CODING_GUIDELINES.md` and `CONTRIBUTING.md`
+- Migration plan document (`migration.md`) for the LLVM 15 → 20 upgrade