From aeb6d1999a8fd2d959a5c4b4b5367f76a58159b4 Mon Sep 17 00:00:00 2001
From: fmoletta <99273364+fmoletta@users.noreply.github.com>
Date: Tue, 6 Feb 2024 15:20:22 +0200
Subject: [PATCH] [Cairo1] Append return values to the output segment when
 running in proof_mode (#1597)

* Force an output builtin to be present when running in proof_mode

* Vm changes

* Minor progress + notes

* Append last return value to the output segment in the proof_mode header

* remove handling that is confusing/not needed

* Extend solution to more than one return value

* Remove block of comment

* Update comments

* Add test that was removed when merged

* Skip output builtin in special final stack method

* Manually set the output builtin's segment size

* Move previous solution to where it is needed

* fmt + Improve comments

* Restore comment

* Improve spelling

* Add changelog entry

* Restore fuzzer/Cargo.lock
---
 CHANGELOG.md                               |  4 +
 cairo1-run/src/main.rs                     | 88 ++++++++++++++++++++--
 vm/src/vm/runners/builtin_runner/output.rs |  4 +
 vm/src/vm/vm_core.rs                       | 11 +++
 4 files changed, 101 insertions(+), 6 deletions(-)
diff --git a/CHANGELOG.md b/CHANGELOG.md
index b141e2de08..ebbe3dfca1 100644
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -2,6 +2,10 @@
 
 #### Upcoming Changes
 
+* feat: Append return values to the output segment when running cairo1-run in proof_mode [#1597](https://github.com/lambdaclass/cairo-vm/pull/1597)
+  * Add instructions to the proof_mode header to copy return values to the output segment before initiating the infinite loop
+  * Output builtin is now always included when running cairo 1 programs in proof_mode
+
 * feat(BREAKING): Remove unecessary conversion functions between `Felt` & `BigUint`/`BigInt` [#1562](https://github.com/lambdaclass/cairo-vm/pull/1562)
   * Remove the following functions:
     * felt_from_biguint
diff --git a/cairo1-run/src/main.rs b/cairo1-run/src/main.rs
index 35e7932706..6c0214d7f7 100644
--- a/cairo1-run/src/main.rs
+++ b/cairo1-run/src/main.rs
@@ -290,6 +290,17 @@ fn run(args: impl Iterator<Item = String>) -> Result<Option<String>, Error> {
     // Get the user program instructions
     let program_instructions = casm_program.instructions.iter();
 
+    // Fetch return type data
+    let return_type_id = main_func
+        .signature
+        .ret_types
+        .last()
+        .ok_or(Error::NoRetTypesInSignature)?;
+    let return_type_size = type_sizes
+        .get(return_type_id)
+        .cloned()
+        .ok_or_else(|| Error::NoTypeSizeForId(return_type_id.clone()))?;
+
     // This footer is used by lib funcs
     let libfunc_footer = create_code_footer();
 
@@ -299,11 +310,34 @@ fn run(args: impl Iterator<Item = String>) -> Result<Option<String>, Error> {
         // This information can be useful for the users using the prover.
         println!("Builtins used: {:?}", builtins);
 
-        // Prepare "canonical" proof mode instructions. These are usually added by the compiler in cairo 0
+        // Create proof_mode specific instructions
+        // Including the "canonical" proof mode instructions (the ones added by the compiler in cairo 0)
+        // wich call the firt program instruction and then initiate an infinite loop.
+        // And also appending the return values to the output builtin's memory segment
+
+        // As the output builtin is not used by cairo 1 (we forced it for this purpose), it's segment is always empty
+        // so we can start writing values directly from it's base, which is located relative to the fp before the other builtin's bases
+        let output_fp_offset: i16 = -(builtins.len() as i16 + 2); // The 2 here represents the return_fp & end segments
+
+        // The pc offset where the original program should start
+        // Without this header it should start at 0, but we add 2 for each call and jump instruction (as both of them use immediate values)
+        // and also 1 for each instruction added to copy each return value into the output segment
+        let program_start_offset: i16 = 4 + return_type_size;
+
         let mut ctx = casm! {};
         casm_extend! {ctx,
-            call rel 4;
-            jmp rel 0;
+            call rel program_start_offset; // Begin program execution by calling the first instruction in the original program
+        };
+        // Append each return value to the output segment
+        for (i, j) in (1..return_type_size + 1).rev().enumerate() {
+            casm_extend! {ctx,
+                // [ap -j] is where each return value is located in memory
+                // [[fp + output_fp_offet] + 0] is the base of the output segment
+                [ap - j] = [[fp + output_fp_offset] + i as i16];
+            };
+        }
+        casm_extend! {ctx,
+            jmp rel 0; // Infinite loop
         };
         ctx.instructions
     } else {
@@ -316,7 +350,7 @@ fn run(args: impl Iterator<Item = String>) -> Result<Option<String>, Error> {
         proof_mode_header.iter(),
         entry_code.iter(),
         program_instructions,
-        libfunc_footer.iter()
+        libfunc_footer.iter(),
     );
 
     let (processor_hints, program_hints) = build_hints_vec(instructions.clone());
@@ -376,6 +410,13 @@ fn run(args: impl Iterator<Item = String>) -> Result<Option<String>, Error> {
 
     // Run it until the end/ infinite loop in proof_mode
     runner.run_until_pc(end, &mut vm, &mut hint_processor)?;
+    if args.proof_mode {
+        // As we will be inserting the return values into the output segment after running the main program (right before the infinite loop) the computed size for the output builtin will be 0
+        // We need to manually set the segment size for the output builtin's segment so memory hole counting doesn't fail due to having a higher accessed address count than the segment's size
+        vm.segments
+            .segment_sizes
+            .insert(2, return_type_size as usize);
+    }
     runner.end_run(false, false, &mut vm, &mut hint_processor)?;
 
     // Fetch return type data
@@ -470,11 +511,18 @@ fn run(args: impl Iterator<Item = String>) -> Result<Option<String>, Error> {
             }
             stack_pointer.offset += size as usize;
         }
+
         // Set stop pointer for each builtin
-        vm.builtins_final_stack_from_stack_pointer_dict(&builtin_name_to_stack_pointer)?;
+        vm.builtins_final_stack_from_stack_pointer_dict(
+            &builtin_name_to_stack_pointer,
+            args.proof_mode,
+        )?;
 
         // Build execution public memory
         if args.proof_mode {
+            // As the output builtin is not used by the program we need to compute it's stop ptr manually
+            vm.set_output_stop_ptr_offset(return_type_size as usize);
+
             runner.finalize_segments(&mut vm)?;
         }
     }
@@ -661,7 +709,8 @@ fn create_entry_code(
 ) -> Result<(Vec<Instruction>, Vec<BuiltinName>), Error> {
     let mut ctx = casm! {};
     // The builtins in the formatting expected by the runner.
-    let (builtins, builtin_offset) = get_function_builtins(func);
+    let (builtins, builtin_offset) = get_function_builtins(func, proof_mode);
+
     // Load all vecs to memory.
     // Load all array args content to memory.
     let mut array_args_data = vec![];
@@ -831,8 +880,21 @@ fn create_metadata(
     }
 }
 
+/// Type representing the Output builtin.
+#[derive(Default)]
+pub struct OutputType {}
+impl cairo_lang_sierra::extensions::NoGenericArgsGenericType for OutputType {
+    const ID: cairo_lang_sierra::ids::GenericTypeId =
+        cairo_lang_sierra::ids::GenericTypeId::new_inline("Output");
+    const STORABLE: bool = true;
+    const DUPLICATABLE: bool = false;
+    const DROPPABLE: bool = false;
+    const ZERO_SIZED: bool = false;
+}
+
 fn get_function_builtins(
     func: &Function,
+    proof_mode: bool,
 ) -> (
     Vec<BuiltinName>,
     HashMap<cairo_lang_sierra::ids::GenericTypeId, i16>,
@@ -880,6 +942,12 @@ fn get_function_builtins(
     {
         builtins.push(BuiltinName::pedersen);
         builtin_offset.insert(PedersenType::ID, current_offset);
+        current_offset += 1;
+    }
+    // Force an output builtin so that we can write the program output into it's segment
+    if proof_mode {
+        builtins.push(BuiltinName::output);
+        builtin_offset.insert(OutputType::ID, current_offset);
     }
     builtins.reverse();
     (builtins, builtin_offset)
@@ -1102,6 +1170,14 @@ mod tests {
         assert_matches!(run(args), Ok(Some(res)) if res == "12");
     }
 
+    #[rstest]
+    #[case(["cairo1-run", "../cairo_programs/cairo-1-programs/struct_span_return.cairo", "--print_output", "--trace_file", "/dev/null", "--memory_file", "/dev/null", "--layout", "all_cairo", "--cairo_pie_output", "/dev/null"].as_slice())]
+    #[case(["cairo1-run", "../cairo_programs/cairo-1-programs/struct_span_return.cairo", "--print_output", "--trace_file", "/dev/null", "--memory_file", "/dev/null", "--layout", "all_cairo", "--proof_mode", "--air_public_input", "/dev/null", "--air_private_input", "/dev/null"].as_slice())]
+    fn test_struct_span_return(#[case] args: &[&str]) {
+        let args = args.iter().cloned().map(String::from);
+        assert_matches!(run(args), Ok(Some(res)) if res == "[[4 3] [2 1]]");
+    }
+
     #[rstest]
     #[case(["cairo1-run", "../cairo_programs/cairo-1-programs/with_input/tensor.cairo", "--print_output", "--trace_file", "/dev/null", "--memory_file", "/dev/null", "--layout", "all_cairo", "--cairo_pie_output", "/dev/null", "--args", "[2 2] [1 2 3 4]"].as_slice())]
     #[case(["cairo1-run", "../cairo_programs/cairo-1-programs/with_input/tensor.cairo", "--print_output", "--trace_file", "/dev/null", "--memory_file", "/dev/null", "--layout", "all_cairo", "--proof_mode", "--air_public_input", "/dev/null", "--air_private_input", "/dev/null", "--args", "[2 2] [1 2 3 4]"].as_slice())]
diff --git a/vm/src/vm/runners/builtin_runner/output.rs b/vm/src/vm/runners/builtin_runner/output.rs
index 1e3bfe3ad4..c774bb330d 100644
--- a/vm/src/vm/runners/builtin_runner/output.rs
+++ b/vm/src/vm/runners/builtin_runner/output.rs
@@ -114,6 +114,10 @@ impl OutputBuiltinRunner {
             attributes: HashMap::default(),
         })
     }
+
+    pub(crate) fn set_stop_ptr_offset(&mut self, offset: usize) {
+        self.stop_ptr = Some(offset)
+    }
 }
 
 impl Default for OutputBuiltinRunner {
diff --git a/vm/src/vm/vm_core.rs b/vm/src/vm/vm_core.rs
index 38be9b1281..4def25700f 100644
--- a/vm/src/vm/vm_core.rs
+++ b/vm/src/vm/vm_core.rs
@@ -1082,8 +1082,12 @@ impl VirtualMachine {
     pub fn builtins_final_stack_from_stack_pointer_dict(
         &mut self,
         builtin_name_to_stack_pointer: &HashMap<&'static str, Relocatable>,
+        skip_output: bool,
     ) -> Result<(), RunnerError> {
         for builtin in self.builtin_runners.iter_mut() {
+            if matches!(builtin, BuiltinRunner::Output(_)) && skip_output {
+                continue;
+            }
             builtin.final_stack(
                 &self.segments,
                 builtin_name_to_stack_pointer
@@ -1094,6 +1098,13 @@ impl VirtualMachine {
         }
         Ok(())
     }
+
+    #[doc(hidden)]
+    pub fn set_output_stop_ptr_offset(&mut self, offset: usize) {
+        if let Some(BuiltinRunner::Output(builtin)) = self.builtin_runners.first_mut() {
+            builtin.set_stop_ptr_offset(offset)
+        }
+    }
 }
 
 pub struct VirtualMachineBuilder {