deploy: 12e85cb778

2025-08-04 11:00:05 +00:00 · 2022-08-21 10:24:24 +00:00 · 2022-08-21 10:24:24 +00:00 · 661232845e
commit 661232845e
parent f01db459c5
9 changed files with 342 additions and 92 deletions
--- a/print.html
+++ b/print.html
@ -575,14 +575,18 @@ This permits the crates to define private functions and other things that are me
 </span><span class="boring">fn main() {
 </span>#[salsa::jar(db = Db)]
 pub struct Jar(
+    crate::compile::compile,
    crate::ir::SourceProgram,
+    crate::ir::Program,
    crate::ir::VariableId,
    crate::ir::FunctionId,
-    crate::ir::Expression,
-    crate::ir::Statement,
    crate::ir::Function,
    crate::ir::Diagnostics,
+    crate::ir::Span,
    crate::parser::parse_statements,
+    crate::type_check::type_check_program,
+    crate::type_check::type_check_function,
+    crate::type_check::find_function,
 );
 <span class="boring">}
 </span></code></pre></pre>
@ -648,6 +652,10 @@ the one which starts up the program, supplies the inputs, and relays the outputs
 </span>#[salsa::db(crate::Jar)]
 pub(crate) struct Database {
    storage: salsa::Storage&lt;Self&gt;,
+
+    // The logs are only used for testing and demonstrating reuse:
+    //
+    logs: Option&lt;Arc&lt;Mutex&lt;Vec&lt;String&gt;&gt;&gt;&gt;,
 }
 <span class="boring">}
 </span></code></pre></pre>
@ -665,6 +673,22 @@ This means that</p>
    fn salsa_runtime(&amp;self) -&gt; &amp;salsa::Runtime {
        self.storage.runtime()
    }
+
+    fn salsa_event(&amp;self, event: salsa::Event) {
+        // Log interesting events, if logging is enabled
+        if let Some(logs) = &amp;self.logs {
+            match event.kind {
+                salsa::EventKind::WillExecute { .. } =&gt; {
+                    logs.lock()
+                        .unwrap()
+                        .push(format!(&quot;Event: {:?}&quot;, event.debug(self)));
+                }
+                _ =&gt; {
+                    // don't log boring events
+                }
+            }
+        }
+    }
 }
 <span class="boring">}
 </span></code></pre></pre>
@ -677,6 +701,7 @@ This means that</p>
    fn snapshot(&amp;self) -&gt; salsa::Snapshot&lt;Self&gt; {
        salsa::Snapshot::new(Database {
            storage: self.storage.snapshot(),
+            logs: self.logs.clone(),
        })
    }
 }
@ -691,6 +716,7 @@ This means that</p>
    fn default() -&gt; Self {
        Self {
            storage: Default::default(),
+            logs: None,
        }
    }
 }
@ -767,10 +793,39 @@ as explained in <a href="tutorial/../overview.html#goal-of-salsa">the overview</
 When you change the value of an input field, that increments a 'revision counter' in the database,
 indicating that some inputs are different now.
 When we talk about a &quot;revision&quot; of the database, we are referring to the state of the database in between changes to the input values.</p>
-<h2 id="tracked-structs-1"><a class="header" href="#tracked-structs-1">Tracked structs</a></h2>
-<p>Next we will define a <strong>tracked struct</strong> to represent the functions in our input.
-Whereas inputs represent the <em>start</em> of a computation, tracked structs represent intermediate values created during your computation.
-In this case, we are going to parse the raw input program, and create a <code>Function</code> for each of the functions defined by the user.</p>
+<h3 id="representing-the-parsed-program"><a class="header" href="#representing-the-parsed-program">Representing the parsed program</a></h3>
+<p>Next we will define a <strong>tracked struct</strong>.
+Whereas inputs represent the <em>start</em> of a computation, tracked structs represent intermediate values created during your computation.</p>
+<p>In this case, the parser is going to take in the <code>SourceProgram</code> struct that we saw and return a <code>Program</code> that represents the fully parsed program:</p>
+<pre><pre class="playground"><code class="language-rust">
+<span class="boring">#![allow(unused)]
+</span><span class="boring">fn main() {
+</span>#[salsa::tracked]
+pub struct Program {
+    #[return_ref]
+    statements: Vec&lt;Statement&gt;,
+}
+<span class="boring">}
+</span></code></pre></pre>
+<p>Like with an input, the fields of a tracked struct are also stored in the database.
+Unlike an input, those fields are immutable (they cannot be &quot;set&quot;), and salsa compares them across revisions to know when they have changed.
+In this case, if parsing the input produced the same <code>Program</code> result (e.g., because the only change to the input was some trailing whitespace, perhaps),
+then subsequent parts of the computation won't need to re-execute.
+(We'll revisit the role of tracked structs in reuse more in future parts of the IR.)</p>
+<p>Apart from the fields being immutable, the API for working with a tracked struct is quite similar to an input:</p>
+<ul>
+<li>You can create a new value by using <code>new</code>, but with a tracked struct, you only need an <code>&amp;dyn</code> database, not <code>&amp;mut</code> (e.g., <code>Program::new(&amp;db, some_staements)</code>)</li>
+<li>You use a getter to read the value of a field, just like with an input (e.g., <code>my_func.statements(db)</code> to read the <code>statements</code> field).
+<ul>
+<li>In this case, the field is tagged as <code>#[return_ref]</code>, which means that the getter will return a <code>&amp;Vec&lt;Statement&gt;</code>, instead of cloning the vector.</li>
+</ul>
+</li>
+</ul>
+<h2 id="representing-functions"><a class="header" href="#representing-functions">Representing functions</a></h2>
+<p>We will also use a tracked struct to represent each function:
+Next we will define a <strong>tracked struct</strong>.
+Whereas inputs represent the <em>start</em> of a computation, tracked structs represent intermediate values created during your computation.</p>
+<p>The <code>Function</code> struct is going to be created by the parser to represent each of the functions defined by the user:</p>
 <pre><pre class="playground"><code class="language-rust">
 <span class="boring">#![allow(unused)]
 </span><span class="boring">fn main() {
@ -778,12 +833,24 @@ In this case, we are going to parse the raw input program, and create a <code>Fu
 pub struct Function {
    #[id]
    name: FunctionId,
+
+    name_span: Span,
+
+    #[return_ref]
    args: Vec&lt;VariableId&gt;,
+
+    #[return_ref]
    body: Expression,
 }
 <span class="boring">}
 </span></code></pre></pre>
-<p>Unlike with inputs, the fields of tracked structs are immutable once created. Otherwise, working with a tracked struct is quite similar to an input:</p>
+<p>Like with an input, the fields of a tracked struct are also stored in the database.
+Unlike an input, those fields are immutable (they cannot be &quot;set&quot;), and salsa compares them across revisions to know when they have changed.
+If we had created some <code>Function</code> instance <code>f</code>, for example, we might find that <code>the f.body</code> field changes
+because the user changed the definition of <code>f</code>.
+This would mean that we have to re-execute those parts of the code that depended on <code>f.body</code>
+(but not those parts of the code that depended on the body of <em>other</em> functions).</p>
+<p>Apart from the fields being immutable, the API for working with a tracked struct is quite similar to an input:</p>
 <ul>
 <li>You can create a new value by using <code>new</code>, but with a tracked struct, you only need an <code>&amp;dyn</code> database, not <code>&amp;mut</code> (e.g., <code>Function::new(&amp;db, some_name, some_args, some_body)</code>)</li>
 <li>You use a getter to read the value of a field, just like with an input (e.g., <code>my_func.args(db)</code> to read the <code>args</code> field).</li>
@ -828,17 +895,26 @@ let f2 = FunctionId::new(&amp;db, &quot;my_string&quot;.to_string());
 assert_eq!(f1, f2);
 <span class="boring">}
 </span></code></pre></pre>
+<h3 id="interned-ids-are-guaranteed-to-be-consistent-within-a-revision-but-not-across-revisions-but-you-dont-have-to-care"><a class="header" href="#interned-ids-are-guaranteed-to-be-consistent-within-a-revision-but-not-across-revisions-but-you-dont-have-to-care">Interned ids are guaranteed to be consistent within a revision, but not across revisions (but you don't have to care)</a></h3>
+<p>Interned ids are guaranteed not to change within a single revision, so you can intern things from all over your program and get back consistent results.
+When you change the inputs, however, salsa may opt to clear some of the interned values and choose different integers.
+However, if this happens, it will also be sure to re-execute every function that interned that value, so all of them still see a consistent value,
+just a different one than they saw in a previous revision.</p>
+<p>In other words, within a salsa computation, you can assume that interning produces a single consistent integer, and you don't have to think about it.
+If however you export interned identifiers outside the computation, and then change the inputs, they may not longer be valid or may refer to different values.</p>
 <h3 id="expressions-and-statements"><a class="header" href="#expressions-and-statements">Expressions and statements</a></h3>
-<p>We'll also intern expressions and statements. This is convenient primarily because it allows us to have recursive structures very easily. Since we don't really need the &quot;cheap equality comparison&quot; aspect of interning, this isn't the most efficient choice, and many compilers would opt to represent expressions/statements in some other way.</p>
+<p>We'll won't use any special &quot;salsa structs&quot; for expressions and statements:</p>
 <pre><pre class="playground"><code class="language-rust">
 <span class="boring">#![allow(unused)]
 </span><span class="boring">fn main() {
-</span>#[salsa::interned]
+</span>#[derive(Eq, PartialEq, Debug, Hash, new)]
 pub struct Statement {
-    data: StatementData,
+    pub span: Span,
+
+    pub data: StatementData,
 }

-#[derive(Eq, PartialEq, Clone, Hash)]
+#[derive(Eq, PartialEq, Debug, Hash)]
 pub enum StatementData {
    /// Defines `fn &lt;name&gt;(&lt;args&gt;) = &lt;body&gt;`
    Function(Function),
@ -846,15 +922,16 @@ pub enum StatementData {
    Print(Expression),
 }

-#[salsa::interned]
+#[derive(Eq, PartialEq, Debug, Hash, new)]
 pub struct Expression {
-    #[return_ref]
-    data: ExpressionData,
+    pub span: Span,
+
+    pub data: ExpressionData,
 }

-#[derive(Eq, PartialEq, Clone, Hash)]
+#[derive(Eq, PartialEq, Debug, Hash)]
 pub enum ExpressionData {
-    Op(Expression, Op, Expression),
+    Op(Box&lt;Expression&gt;, Op, Box&lt;Expression&gt;),
    Number(OrderedFloat&lt;f64&gt;),
    Variable(VariableId),
    Call(FunctionId, Vec&lt;Expression&gt;),
@ -869,13 +946,10 @@ pub enum Op {
 }
 <span class="boring">}
 </span></code></pre></pre>
-<h3 id="interned-ids-are-guaranteed-to-be-consistent-within-a-revision-but-not-across-revisions-but-you-dont-have-to-care"><a class="header" href="#interned-ids-are-guaranteed-to-be-consistent-within-a-revision-but-not-across-revisions-but-you-dont-have-to-care">Interned ids are guaranteed to be consistent within a revision, but not across revisions (but you don't have to care)</a></h3>
-<p>Interned ids are guaranteed not to change within a single revision, so you can intern things from all over your program and get back consistent results.
-When you change the inputs, however, salsa may opt to clear some of the interned values and choose different integers.
-However, if this happens, it will also be sure to re-execute every function that interned that value, so all of them still see a consistent value,
-just a different one than they saw in a previous revision.</p>
-<p>In other words, within a salsa computation, you can assume that interning produces a single consistent integer, and you don't have to think about it.
-If however you export interned identifiers outside the computation, and then change the inputs, they may not longer be valid or may refer to different values.</p>
+<p>Since statements and expressions are not tracked, this implies that we are only attempting to get incremental re-use at the granularity of functions --
+whenever anything in a function body changes, we consider the entire function body dirty and re-execute anything that depended on it.
+It usually makes sense to draw some kind of &quot;reasonably coarse&quot; boundary like this.</p>
+<p>One downside of the way we have set things up: we inlined the position into each of the structs.</p>
 <div style="break-before: page; page-break-before: always;"></div><h1 id="defining-the-parser-memoized-functions-and-inputs"><a class="header" href="#defining-the-parser-memoized-functions-and-inputs">Defining the parser: memoized functions and inputs</a></h1>
 <p>The next step in the <code>calc</code> compiler is to define the parser.
 The role of the parser will be to take the <code>ProgramSource</code> input,
@ -890,8 +964,8 @@ We're going to focus only on the salsa-related aspects.</p>
 <pre><pre class="playground"><code class="language-rust">
 <span class="boring">#![allow(unused)]
 </span><span class="boring">fn main() {
-</span>#[salsa::tracked(return_ref)]
-pub fn parse_statements(db: &amp;dyn crate::Db, source: SourceProgram) -&gt; Vec&lt;Statement&gt; {
+</span>#[salsa::tracked]
+pub fn parse_statements(db: &amp;dyn crate::Db, source: SourceProgram) -&gt; Program {
    // Get the source text from the database
    let source_text = source.text(db);

@ -925,7 +999,7 @@ pub fn parse_statements(db: &amp;dyn crate::Db, source: SourceProgram) -&gt; Vec
        }
    }

-    result
+    Program::new(db, result)
 }
 <span class="boring">}
 </span></code></pre></pre>
@ -982,9 +1056,10 @@ In our case, we define an accumulator struct called <code>Diagnostics</code> in
 </span>#[salsa::accumulator]
 pub struct Diagnostics(Diagnostic);

-#[derive(Clone, Debug)]
+#[derive(new, Clone, Debug)]
 pub struct Diagnostic {
-    pub position: usize,
+    pub start: usize,
+    pub end: usize,
    pub message: String,
 }
 <span class="boring">}
@ -1000,10 +1075,15 @@ or any function that it called
 </span><span class="boring">fn main() {
 </span>    /// Report an error diagnostic at the current position.
    fn report_error(&amp;self) {
+        let next_position = match self.peek() {
+            Some(ch) =&gt; self.position + ch.len_utf8(),
+            None =&gt; self.position,
+        };
        Diagnostics::push(
            self.db,
            Diagnostic {
-                position: self.position,
+                start: self.position,
+                end: next_position,
                message: &quot;unexpected character&quot;.to_string(),
            },
        );
@ -1048,7 +1128,7 @@ This is tedious but not difficult. Here is an example of implementing the trait
 </span><span class="boring">fn main() {
 </span>impl DebugWithDb&lt;dyn crate::Db + '_&gt; for Expression {
    fn fmt(&amp;self, f: &amp;mut std::fmt::Formatter&lt;'_&gt;, db: &amp;dyn crate::Db) -&gt; std::fmt::Result {
-        match self.data(db) {
+        match &amp;self.data {
            ExpressionData::Op(a, b, c) =&gt; f
                .debug_tuple(&quot;ExpressionData::Op&quot;)
                .field(&amp;a.debug(db)) // use `a.debug(db)` for interned things
@ -1098,16 +1178,29 @@ impl DebugWithDb&lt;dyn crate::Db + '_&gt; for Diagnostic {
 pub struct Function {
    #[id]
    name: FunctionId,
+
+    name_span: Span,
+
+    #[return_ref]
    args: Vec&lt;VariableId&gt;,
+
+    #[return_ref]
    body: Expression,
 }

+#[salsa::tracked]
+pub struct Span {
+    pub start: usize,
+    pub end: usize,
+}
+
 #[salsa::accumulator]
 pub struct Diagnostics(Diagnostic);

-#[derive(Clone, Debug)]
+#[derive(new, Clone, Debug)]
 pub struct Diagnostic {
-    pub position: usize,
+    pub start: usize,
+    pub end: usize,
    pub message: String,
 }
 <span class="boring">}
@ -1150,21 +1243,53 @@ fn parse_print() {
    let actual = parse_string(&quot;print 1 + 2&quot;);
    let expected = expect_test::expect![[r#&quot;
        (
-            [
-                ExpressionData::Op(
-                    Number(
-                        OrderedFloat(
-                            1.0,
+            Program {
+                statements: [
+                    Statement {
+                        span: Span(
+                            Id {
+                                value: 5,
+                            },
                        ),
-                    ),
-                    Add,
-                    Number(
-                        OrderedFloat(
-                            2.0,
+                        data: Print(
+                            Expression {
+                                span: Span(
+                                    Id {
+                                        value: 4,
+                                    },
+                                ),
+                                data: Op(
+                                    Expression {
+                                        span: Span(
+                                            Id {
+                                                value: 1,
+                                            },
+                                        ),
+                                        data: Number(
+                                            OrderedFloat(
+                                                1.0,
+                                            ),
+                                        ),
+                                    },
+                                    Add,
+                                    Expression {
+                                        span: Span(
+                                            Id {
+                                                value: 3,
+                                            },
+                                        ),
+                                        data: Number(
+                                            OrderedFloat(
+                                                2.0,
+                                            ),
+                                        ),
+                                    },
+                                ),
+                            },
                        ),
-                    ),
-                ),
-            ],
+                    },
+                ],
+            },
            [],
        )&quot;#]];
    expected.assert_eq(&amp;actual);
--- a/searchindex.js
+++ b/searchindex.js
--- a/searchindex.json
+++ b/searchindex.json
--- a/tutorial/accumulators.html
+++ b/tutorial/accumulators.html
@ -157,9 +157,10 @@ In our case, we define an accumulator struct called <code>Diagnostics</code> in
 </span>#[salsa::accumulator]
 pub struct Diagnostics(Diagnostic);

-#[derive(Clone, Debug)]
+#[derive(new, Clone, Debug)]
 pub struct Diagnostic {
-    pub position: usize,
+    pub start: usize,
+    pub end: usize,
    pub message: String,
 }
 <span class="boring">}
@ -175,10 +176,15 @@ or any function that it called
 </span><span class="boring">fn main() {
 </span>    /// Report an error diagnostic at the current position.
    fn report_error(&amp;self) {
+        let next_position = match self.peek() {
+            Some(ch) =&gt; self.position + ch.len_utf8(),
+            None =&gt; self.position,
+        };
        Diagnostics::push(
            self.db,
            Diagnostic {
-                position: self.position,
+                start: self.position,
+                end: next_position,
                message: &quot;unexpected character&quot;.to_string(),
            },
        );
--- a/tutorial/db.html
+++ b/tutorial/db.html
@ -156,6 +156,10 @@ the one which starts up the program, supplies the inputs, and relays the outputs
 </span>#[salsa::db(crate::Jar)]
 pub(crate) struct Database {
    storage: salsa::Storage&lt;Self&gt;,
+
+    // The logs are only used for testing and demonstrating reuse:
+    //
+    logs: Option&lt;Arc&lt;Mutex&lt;Vec&lt;String&gt;&gt;&gt;&gt;,
 }
 <span class="boring">}
 </span></code></pre></pre>
@ -173,6 +177,22 @@ This means that</p>
    fn salsa_runtime(&amp;self) -&gt; &amp;salsa::Runtime {
        self.storage.runtime()
    }
+
+    fn salsa_event(&amp;self, event: salsa::Event) {
+        // Log interesting events, if logging is enabled
+        if let Some(logs) = &amp;self.logs {
+            match event.kind {
+                salsa::EventKind::WillExecute { .. } =&gt; {
+                    logs.lock()
+                        .unwrap()
+                        .push(format!(&quot;Event: {:?}&quot;, event.debug(self)));
+                }
+                _ =&gt; {
+                    // don't log boring events
+                }
+            }
+        }
+    }
 }
 <span class="boring">}
 </span></code></pre></pre>
@ -185,6 +205,7 @@ This means that</p>
    fn snapshot(&amp;self) -&gt; salsa::Snapshot&lt;Self&gt; {
        salsa::Snapshot::new(Database {
            storage: self.storage.snapshot(),
+            logs: self.logs.clone(),
        })
    }
 }
@ -199,6 +220,7 @@ This means that</p>
    fn default() -&gt; Self {
        Self {
            storage: Default::default(),
+            logs: None,
        }
    }
 }
--- a/tutorial/debug.html
+++ b/tutorial/debug.html
@ -169,7 +169,7 @@ This is tedious but not difficult. Here is an example of implementing the trait
 </span><span class="boring">fn main() {
 </span>impl DebugWithDb&lt;dyn crate::Db + '_&gt; for Expression {
    fn fmt(&amp;self, f: &amp;mut std::fmt::Formatter&lt;'_&gt;, db: &amp;dyn crate::Db) -&gt; std::fmt::Result {
-        match self.data(db) {
+        match &amp;self.data {
            ExpressionData::Op(a, b, c) =&gt; f
                .debug_tuple(&quot;ExpressionData::Op&quot;)
                .field(&amp;a.debug(db)) // use `a.debug(db)` for interned things
@ -219,16 +219,29 @@ impl DebugWithDb&lt;dyn crate::Db + '_&gt; for Diagnostic {
 pub struct Function {
    #[id]
    name: FunctionId,
+
+    name_span: Span,
+
+    #[return_ref]
    args: Vec&lt;VariableId&gt;,
+
+    #[return_ref]
    body: Expression,
 }

+#[salsa::tracked]
+pub struct Span {
+    pub start: usize,
+    pub end: usize,
+}
+
 #[salsa::accumulator]
 pub struct Diagnostics(Diagnostic);

-#[derive(Clone, Debug)]
+#[derive(new, Clone, Debug)]
 pub struct Diagnostic {
-    pub position: usize,
+    pub start: usize,
+    pub end: usize,
    pub message: String,
 }
 <span class="boring">}
@ -271,21 +284,53 @@ fn parse_print() {
    let actual = parse_string(&quot;print 1 + 2&quot;);
    let expected = expect_test::expect![[r#&quot;
        (
-            [
-                ExpressionData::Op(
-                    Number(
-                        OrderedFloat(
-                            1.0,
+            Program {
+                statements: [
+                    Statement {
+                        span: Span(
+                            Id {
+                                value: 5,
+                            },
                        ),
-                    ),
-                    Add,
-                    Number(
-                        OrderedFloat(
-                            2.0,
+                        data: Print(
+                            Expression {
+                                span: Span(
+                                    Id {
+                                        value: 4,
+                                    },
+                                ),
+                                data: Op(
+                                    Expression {
+                                        span: Span(
+                                            Id {
+                                                value: 1,
+                                            },
+                                        ),
+                                        data: Number(
+                                            OrderedFloat(
+                                                1.0,
+                                            ),
+                                        ),
+                                    },
+                                    Add,
+                                    Expression {
+                                        span: Span(
+                                            Id {
+                                                value: 3,
+                                            },
+                                        ),
+                                        data: Number(
+                                            OrderedFloat(
+                                                2.0,
+                                            ),
+                                        ),
+                                    },
+                                ),
+                            },
                        ),
-                    ),
-                ),
-            ],
+                    },
+                ],
+            },
            [],
        )&quot;#]];
    expected.assert_eq(&amp;actual);
--- a/tutorial/ir.html
+++ b/tutorial/ir.html
@ -209,10 +209,39 @@ as explained in <a href="../overview.html#goal-of-salsa">the overview</a>.
 When you change the value of an input field, that increments a 'revision counter' in the database,
 indicating that some inputs are different now.
 When we talk about a &quot;revision&quot; of the database, we are referring to the state of the database in between changes to the input values.</p>
-<h2 id="tracked-structs"><a class="header" href="#tracked-structs">Tracked structs</a></h2>
-<p>Next we will define a <strong>tracked struct</strong> to represent the functions in our input.
-Whereas inputs represent the <em>start</em> of a computation, tracked structs represent intermediate values created during your computation.
-In this case, we are going to parse the raw input program, and create a <code>Function</code> for each of the functions defined by the user.</p>
+<h3 id="representing-the-parsed-program"><a class="header" href="#representing-the-parsed-program">Representing the parsed program</a></h3>
+<p>Next we will define a <strong>tracked struct</strong>.
+Whereas inputs represent the <em>start</em> of a computation, tracked structs represent intermediate values created during your computation.</p>
+<p>In this case, the parser is going to take in the <code>SourceProgram</code> struct that we saw and return a <code>Program</code> that represents the fully parsed program:</p>
+<pre><pre class="playground"><code class="language-rust">
+<span class="boring">#![allow(unused)]
+</span><span class="boring">fn main() {
+</span>#[salsa::tracked]
+pub struct Program {
+    #[return_ref]
+    statements: Vec&lt;Statement&gt;,
+}
+<span class="boring">}
+</span></code></pre></pre>
+<p>Like with an input, the fields of a tracked struct are also stored in the database.
+Unlike an input, those fields are immutable (they cannot be &quot;set&quot;), and salsa compares them across revisions to know when they have changed.
+In this case, if parsing the input produced the same <code>Program</code> result (e.g., because the only change to the input was some trailing whitespace, perhaps),
+then subsequent parts of the computation won't need to re-execute.
+(We'll revisit the role of tracked structs in reuse more in future parts of the IR.)</p>
+<p>Apart from the fields being immutable, the API for working with a tracked struct is quite similar to an input:</p>
+<ul>
+<li>You can create a new value by using <code>new</code>, but with a tracked struct, you only need an <code>&amp;dyn</code> database, not <code>&amp;mut</code> (e.g., <code>Program::new(&amp;db, some_staements)</code>)</li>
+<li>You use a getter to read the value of a field, just like with an input (e.g., <code>my_func.statements(db)</code> to read the <code>statements</code> field).
+<ul>
+<li>In this case, the field is tagged as <code>#[return_ref]</code>, which means that the getter will return a <code>&amp;Vec&lt;Statement&gt;</code>, instead of cloning the vector.</li>
+</ul>
+</li>
+</ul>
+<h2 id="representing-functions"><a class="header" href="#representing-functions">Representing functions</a></h2>
+<p>We will also use a tracked struct to represent each function:
+Next we will define a <strong>tracked struct</strong>.
+Whereas inputs represent the <em>start</em> of a computation, tracked structs represent intermediate values created during your computation.</p>
+<p>The <code>Function</code> struct is going to be created by the parser to represent each of the functions defined by the user:</p>
 <pre><pre class="playground"><code class="language-rust">
 <span class="boring">#![allow(unused)]
 </span><span class="boring">fn main() {
@ -220,12 +249,24 @@ In this case, we are going to parse the raw input program, and create a <code>Fu
 pub struct Function {
    #[id]
    name: FunctionId,
+
+    name_span: Span,
+
+    #[return_ref]
    args: Vec&lt;VariableId&gt;,
+
+    #[return_ref]
    body: Expression,
 }
 <span class="boring">}
 </span></code></pre></pre>
-<p>Unlike with inputs, the fields of tracked structs are immutable once created. Otherwise, working with a tracked struct is quite similar to an input:</p>
+<p>Like with an input, the fields of a tracked struct are also stored in the database.
+Unlike an input, those fields are immutable (they cannot be &quot;set&quot;), and salsa compares them across revisions to know when they have changed.
+If we had created some <code>Function</code> instance <code>f</code>, for example, we might find that <code>the f.body</code> field changes
+because the user changed the definition of <code>f</code>.
+This would mean that we have to re-execute those parts of the code that depended on <code>f.body</code>
+(but not those parts of the code that depended on the body of <em>other</em> functions).</p>
+<p>Apart from the fields being immutable, the API for working with a tracked struct is quite similar to an input:</p>
 <ul>
 <li>You can create a new value by using <code>new</code>, but with a tracked struct, you only need an <code>&amp;dyn</code> database, not <code>&amp;mut</code> (e.g., <code>Function::new(&amp;db, some_name, some_args, some_body)</code>)</li>
 <li>You use a getter to read the value of a field, just like with an input (e.g., <code>my_func.args(db)</code> to read the <code>args</code> field).</li>
@ -270,17 +311,26 @@ let f2 = FunctionId::new(&amp;db, &quot;my_string&quot;.to_string());
 assert_eq!(f1, f2);
 <span class="boring">}
 </span></code></pre></pre>
+<h3 id="interned-ids-are-guaranteed-to-be-consistent-within-a-revision-but-not-across-revisions-but-you-dont-have-to-care"><a class="header" href="#interned-ids-are-guaranteed-to-be-consistent-within-a-revision-but-not-across-revisions-but-you-dont-have-to-care">Interned ids are guaranteed to be consistent within a revision, but not across revisions (but you don't have to care)</a></h3>
+<p>Interned ids are guaranteed not to change within a single revision, so you can intern things from all over your program and get back consistent results.
+When you change the inputs, however, salsa may opt to clear some of the interned values and choose different integers.
+However, if this happens, it will also be sure to re-execute every function that interned that value, so all of them still see a consistent value,
+just a different one than they saw in a previous revision.</p>
+<p>In other words, within a salsa computation, you can assume that interning produces a single consistent integer, and you don't have to think about it.
+If however you export interned identifiers outside the computation, and then change the inputs, they may not longer be valid or may refer to different values.</p>
 <h3 id="expressions-and-statements"><a class="header" href="#expressions-and-statements">Expressions and statements</a></h3>
-<p>We'll also intern expressions and statements. This is convenient primarily because it allows us to have recursive structures very easily. Since we don't really need the &quot;cheap equality comparison&quot; aspect of interning, this isn't the most efficient choice, and many compilers would opt to represent expressions/statements in some other way.</p>
+<p>We'll won't use any special &quot;salsa structs&quot; for expressions and statements:</p>
 <pre><pre class="playground"><code class="language-rust">
 <span class="boring">#![allow(unused)]
 </span><span class="boring">fn main() {
-</span>#[salsa::interned]
+</span>#[derive(Eq, PartialEq, Debug, Hash, new)]
 pub struct Statement {
-    data: StatementData,
+    pub span: Span,
+
+    pub data: StatementData,
 }

-#[derive(Eq, PartialEq, Clone, Hash)]
+#[derive(Eq, PartialEq, Debug, Hash)]
 pub enum StatementData {
    /// Defines `fn &lt;name&gt;(&lt;args&gt;) = &lt;body&gt;`
    Function(Function),
@ -288,15 +338,16 @@ pub enum StatementData {
    Print(Expression),
 }

-#[salsa::interned]
+#[derive(Eq, PartialEq, Debug, Hash, new)]
 pub struct Expression {
-    #[return_ref]
-    data: ExpressionData,
+    pub span: Span,
+
+    pub data: ExpressionData,
 }

-#[derive(Eq, PartialEq, Clone, Hash)]
+#[derive(Eq, PartialEq, Debug, Hash)]
 pub enum ExpressionData {
-    Op(Expression, Op, Expression),
+    Op(Box&lt;Expression&gt;, Op, Box&lt;Expression&gt;),
    Number(OrderedFloat&lt;f64&gt;),
    Variable(VariableId),
    Call(FunctionId, Vec&lt;Expression&gt;),
@ -311,13 +362,10 @@ pub enum Op {
 }
 <span class="boring">}
 </span></code></pre></pre>
-<h3 id="interned-ids-are-guaranteed-to-be-consistent-within-a-revision-but-not-across-revisions-but-you-dont-have-to-care"><a class="header" href="#interned-ids-are-guaranteed-to-be-consistent-within-a-revision-but-not-across-revisions-but-you-dont-have-to-care">Interned ids are guaranteed to be consistent within a revision, but not across revisions (but you don't have to care)</a></h3>
-<p>Interned ids are guaranteed not to change within a single revision, so you can intern things from all over your program and get back consistent results.
-When you change the inputs, however, salsa may opt to clear some of the interned values and choose different integers.
-However, if this happens, it will also be sure to re-execute every function that interned that value, so all of them still see a consistent value,
-just a different one than they saw in a previous revision.</p>
-<p>In other words, within a salsa computation, you can assume that interning produces a single consistent integer, and you don't have to think about it.
-If however you export interned identifiers outside the computation, and then change the inputs, they may not longer be valid or may refer to different values.</p>
+<p>Since statements and expressions are not tracked, this implies that we are only attempting to get incremental re-use at the granularity of functions --
+whenever anything in a function body changes, we consider the entire function body dirty and re-execute anything that depended on it.
+It usually makes sense to draw some kind of &quot;reasonably coarse&quot; boundary like this.</p>
+<p>One downside of the way we have set things up: we inlined the position into each of the structs.</p>

                    </main>

--- a/tutorial/jar.html
+++ b/tutorial/jar.html
@ -164,14 +164,18 @@ This permits the crates to define private functions and other things that are me
 </span><span class="boring">fn main() {
 </span>#[salsa::jar(db = Db)]
 pub struct Jar(
+    crate::compile::compile,
    crate::ir::SourceProgram,
+    crate::ir::Program,
    crate::ir::VariableId,
    crate::ir::FunctionId,
-    crate::ir::Expression,
-    crate::ir::Statement,
    crate::ir::Function,
    crate::ir::Diagnostics,
+    crate::ir::Span,
    crate::parser::parse_statements,
+    crate::type_check::type_check_program,
+    crate::type_check::type_check_function,
+    crate::type_check::find_function,
 );
 <span class="boring">}
 </span></code></pre></pre>
--- a/tutorial/parser.html
+++ b/tutorial/parser.html
@ -158,8 +158,8 @@ We're going to focus only on the salsa-related aspects.</p>
 <pre><pre class="playground"><code class="language-rust">
 <span class="boring">#![allow(unused)]
 </span><span class="boring">fn main() {
-</span>#[salsa::tracked(return_ref)]
-pub fn parse_statements(db: &amp;dyn crate::Db, source: SourceProgram) -&gt; Vec&lt;Statement&gt; {
+</span>#[salsa::tracked]
+pub fn parse_statements(db: &amp;dyn crate::Db, source: SourceProgram) -&gt; Program {
    // Get the source text from the database
    let source_text = source.text(db);

@ -193,7 +193,7 @@ pub fn parse_statements(db: &amp;dyn crate::Db, source: SourceProgram) -&gt; Vec
        }
    }

-    result
+    Program::new(db, result)
 }
 <span class="boring">}
 </span></code></pre></pre>