Compare commits

...

12 Commits

Author SHA1 Message Date
ee51578f99 upload result plot 2025-12-06 17:52:50 -05:00
621fb1feb2 add homework11 2025-12-06 17:52:21 -05:00
33a3157bc8 add homework10 2025-11-23 16:16:53 -05:00
f9fdf4002c remove unnecessary Zone.Identifier file from project2 2025-11-12 19:58:02 -05:00
dd4675235d add project2 2025-11-10 20:23:08 -05:00
bd5715388b add homework 8 2025-11-05 11:03:28 -05:00
323f757b14 fix project1 q3 bug 2025-10-21 16:49:59 -04:00
1ecd5a4bbe fix project 1 q1 bug 2025-10-21 16:25:27 -04:00
5acb5d6900 fix project 1 q3 2025-10-20 23:10:08 -04:00
ad53ec4eeb update readme and questions of project 1 2025-10-15 15:23:32 -04:00
20965947f0 update latex report 2025-10-15 15:23:16 -04:00
248720434f update gitignore 2025-10-15 15:23:06 -04:00
38 changed files with 1589 additions and 33 deletions

6
.gitignore vendored
View File

@@ -1 +1,5 @@
.vscode
.vscode
.DS_Store
__pycache__
*.pyc
*Zone.Identifier

249
homework10/Homework10_Q1.py Normal file
View File

@@ -0,0 +1,249 @@
import numpy as np
import matplotlib.pyplot as plt
import sys
# Configuration for plotting
plt.style.use('seaborn-v0_8')
plt.rcParams['figure.figsize'] = (18, 6)
def newton_method(f, df, x0, tolerance=1e-12, max_iter=20):
"""
Implements Newton's Method with overflow protection.
Returns: list of iteration history [(iter, x, error)]
"""
history = []
x = x0
for i in range(max_iter):
try:
# Check for divergence first
if abs(x) > 1e100:
break
fx = f(x)
dfx = df(x)
if abs(dfx) < 1e-15: # Avoid division by zero
break
history.append(x)
x_new = x - fx / dfx
# Check convergence
if abs(x_new - x) < tolerance:
x = x_new
history.append(x)
break
x = x_new
except OverflowError:
# Catch errors if numbers become too large
break
return history
def chord_method(f, df_x0, x0, tolerance=1e-12, max_iter=50):
"""
Implements Chord Method using fixed slope m = f'(x0) with overflow protection.
Returns: list of iteration history
"""
history = []
x = x0
m = df_x0 # Fixed slope
for i in range(max_iter):
try:
if abs(x) > 1e100:
break
fx = f(x)
history.append(x)
if abs(m) < 1e-15:
break
x_new = x - fx / m
if abs(x_new - x) < tolerance:
x = x_new
history.append(x)
break
x = x_new
except OverflowError:
break
return history
def secant_method(f, x0, x_minus_1, tolerance=1e-12, max_iter=20):
"""
Implements Secant Method with overflow protection.
Returns: list of iteration history
"""
history = []
x_curr = x0
x_prev = x_minus_1
for i in range(max_iter):
try:
if abs(x_curr) > 1e100:
break
history.append(x_curr)
fx_curr = f(x_curr)
fx_prev = f(x_prev)
if abs(fx_curr - fx_prev) < 1e-15:
break
# Secant update
x_new = x_curr - fx_curr * (x_curr - x_prev) / (fx_curr - fx_prev)
if abs(x_new - x_curr) < tolerance:
x_curr = x_new
history.append(x_curr)
break
x_prev = x_curr
x_curr = x_new
except OverflowError:
break
return history
def solve_and_save():
# Definition of problems
problems = [
{
'id': 'a',
'title': r'$f(x) = \cos(x) - x, x_0 = 0.5$',
'func_name': 'cos(x) - x',
'f': lambda x: np.cos(x) - x,
'df': lambda x: -np.sin(x) - 1,
'x0': 0.5,
'true_root': 0.73908513321516064165531208767387340401341175890075746496568063577328465488354759 # From wolframalpha
},
{
'id': 'b',
'title': r'$f(x) = \sin(x), x_0 = 3$',
'func_name': 'sin(x)',
'f': lambda x: np.sin(x),
'df': lambda x: np.cos(x),
'x0': 3.0,
'true_root': np.pi
},
{
'id': 'c',
'title': r'$f(x) = x^2 + 1, x_0 = 0.5$',
'func_name': 'x^2 + 1',
'f': lambda x: x**2 + 1,
'df': lambda x: 2*x,
'x0': 0.5,
'true_root': None # No real root
}
]
# Open file for writing text results
output_filename = 'numerical_results.txt'
image_filename = 'convergence_results.png'
with open(output_filename, 'w', encoding='utf-8') as txt_file:
fig, axes = plt.subplots(1, 3)
for idx, prob in enumerate(problems):
header_str = f"\n{'='*60}\nProblem ({prob['id']}): {prob['func_name']}, x0={prob['x0']}\n{'='*60}\n"
print(header_str) # Print to console to show progress
txt_file.write(header_str)
x0 = prob['x0']
f = prob['f']
df = prob['df']
# 1. Run Newton
hist_newton = newton_method(f, df, x0)
# 2. Run Chord (m = f'(x0))
hist_chord = chord_method(f, df(x0), x0)
# 3. Run Secant (x_-1 = 0.99 * x0)
x_minus_1 = 0.99 * x0
hist_secant = secant_method(f, x0, x_minus_1)
methods_data = {
"Newton": hist_newton,
"Chord": hist_chord,
"Secant": hist_secant
}
ax = axes[idx]
for m_name, history in methods_data.items():
iters = list(range(len(history)))
errors = []
# Calculate errors for plotting
# Note: Handling overflow for plotting large errors in problem c
for x in history:
try:
if prob['true_root'] is not None:
val = abs(x - prob['true_root'])
else:
val = abs(f(x)) # Residual for problem c
errors.append(val)
except OverflowError:
errors.append(float('inf'))
# Write to TXT file
txt_file.write(f"\nMethod: {m_name}\n")
txt_file.write(f"{'Iter':<5} | {'Value (x_k)':<25} | {'Error/Resid':<25}\n")
txt_file.write("-" * 60 + "\n")
for i, val in enumerate(history):
# Only write full history if short, or head/tail if long
if len(history) < 20 or i < 5 or i > len(history) - 3:
if prob['true_root'] is not None:
err_val = abs(val - prob['true_root'])
else:
try:
err_val = abs(f(val))
except OverflowError:
err_val = float('inf')
txt_file.write(f"{i:<5} | {val:<25.10g} | {err_val:<25.6e}\n")
elif i == 5:
txt_file.write("...\n")
# Add to plot
if prob['true_root'] is not None:
ylabel_text = "Error |x_k - x*|"
log_scale = True
ax.plot(iters, errors, marker='o', label=m_name)
else:
ylabel_text = "Residual |f(x_k)|"
log_scale = False
# For problem C, data explodes, so we limit plotting range to avoid ruining the graph
valid_errors = [e for e in errors if e < 1e10]
valid_iters = iters[:len(valid_errors)]
ax.plot(valid_iters, valid_errors, marker='x', label=m_name)
ax.set_title(f"Problem ({prob['id']})\n{prob['title']}")
ax.set_xlabel("Iteration")
ax.set_ylabel(ylabel_text)
if log_scale:
ax.set_yscale('log')
ax.legend()
if prob['id'] == 'c':
ax.set_ylim(0, 20)
ax.set_xticks(range(0, len(iters), 1))
ax.grid(True)
print(f"\nText results saved to: {output_filename}")
plt.tight_layout()
plt.savefig(image_filename)
print(f"Chart saved to: {image_filename}")
if __name__ == "__main__":
solve_and_save()

1
homework10/comment.txt Normal file
View File

@@ -0,0 +1 @@
For problems (a) and (b), which have real roots, all methods converged; Newton's method was the fastest (quadratic), followed by the Secant method (superlinear), with the Chord method being the slowest (linear). However, for problem (c) (x^2 + 1), which has no real roots, all methods failed: the Chord method rapidly diverged to infinity, while Secant and Newton's method oscillated.

Binary file not shown (new image, 128 KiB).

View File

@@ -0,0 +1,112 @@
============================================================
Problem (a): cos(x) - x, x0=0.5
============================================================
Method: Newton
Iter | Value (x_k) | Error/Resid
------------------------------------------------------------
0 | 0.5 | 2.390851e-01
1 | 0.7552224171 | 1.613728e-02
2 | 0.7391416661 | 5.653293e-05
3 | 0.7390851339 | 7.056461e-10
4 | 0.7390851332 | 0.000000e+00
5 | 0.7390851332 | 0.000000e+00
Method: Chord
Iter | Value (x_k) | Error/Resid
------------------------------------------------------------
0 | 0.5 | 2.390851e-01
1 | 0.7552224171 | 1.613728e-02
2 | 0.7369022576 | 2.182876e-03
3 | 0.7393704622 | 2.853290e-04
4 | 0.7390476612 | 3.747205e-05
...
13 | 0.7390851332 | 4.333200e-13
14 | 0.7390851332 | 5.695444e-14
Method: Secant
Iter | Value (x_k) | Error/Resid
------------------------------------------------------------
0 | 0.5 | 2.390851e-01
1 | 0.7556018135 | 1.651668e-02
2 | 0.738106944 | 9.781892e-04
3 | 0.7390815948 | 3.538433e-06
4 | 0.739085134 | 7.646579e-10
5 | 0.7390851332 | 5.551115e-16
6 | 0.7390851332 | 0.000000e+00
============================================================
Problem (b): sin(x), x0=3.0
============================================================
Method: Newton
Iter | Value (x_k) | Error/Resid
------------------------------------------------------------
0 | 3 | 1.415927e-01
1 | 3.142546543 | 9.538895e-04
2 | 3.141592653 | 2.893161e-10
3 | 3.141592654 | 0.000000e+00
4 | 3.141592654 | 0.000000e+00
Method: Chord
Iter | Value (x_k) | Error/Resid
------------------------------------------------------------
0 | 3 | 1.415927e-01
1 | 3.142546543 | 9.538895e-04
2 | 3.141583011 | 9.642404e-06
3 | 3.141592751 | 9.747184e-08
4 | 3.141592653 | 9.853101e-10
5 | 3.141592654 | 9.960477e-12
6 | 3.141592654 | 1.003642e-13
7 | 3.141592654 | 1.332268e-15
Method: Secant
Iter | Value (x_k) | Error/Resid
------------------------------------------------------------
0 | 3 | 1.415927e-01
1 | 3.142873442 | 1.280788e-03
2 | 3.141588403 | 4.250744e-06
3 | 3.141592654 | 1.158629e-12
4 | 3.141592654 | 0.000000e+00
5 | 3.141592654 | 0.000000e+00
============================================================
Problem (c): x^2 + 1, x0=0.5
============================================================
Method: Newton
Iter | Value (x_k) | Error/Resid
------------------------------------------------------------
0 | 0.5 | 1.250000e+00
1 | -0.75 | 1.562500e+00
2 | 0.2916666667 | 1.085069e+00
3 | -1.568452381 | 3.460043e+00
4 | -0.4654406117 | 1.216635e+00
...
18 | -1.820817243 | 4.315375e+00
19 | -0.6358066524 | 1.404250e+00
Method: Chord
Iter | Value (x_k) | Error/Resid
------------------------------------------------------------
0 | 0.5 | 1.250000e+00
1 | -0.75 | 1.562500e+00
2 | -2.3125 | 6.347656e+00
3 | -8.66015625 | 7.599831e+01
4 | -84.65846252 | 7.168055e+03
...
8 | -7.660265913e+30 | 5.867967e+61
9 | -5.867967385e+61 | 3.443304e+123
Method: Secant
Iter | Value (x_k) | Error/Resid
------------------------------------------------------------
0 | 0.5 | 1.250000e+00
1 | -0.756281407 | 1.571962e+00
2 | 5.37745098 | 2.991698e+01
3 | -1.096446714 | 2.202195e+00
4 | -1.610857647 | 3.594862e+00
...
18 | 0.3478146096 | 1.120975e+00
19 | -2.615940634 | 7.843145e+00

159
homework11/Homework11_Q5.py Normal file
View File

@@ -0,0 +1,159 @@
import numpy as np
import matplotlib.pyplot as plt
# --- 1. Define Function, Gradient, and Hessian ---
# Objective function: Rosenbrock function
def objective_function(x):
x1, x2 = x[0], x[1]
return 100 * (x2 - x1**2)**2 + (1 - x1)**2
# Gradient vector calculation
def gradient(x):
x1, x2 = x[0], x[1]
df_dx1 = -400 * x1 * (x2 - x1**2) - 2 * (1 - x1)
df_dx2 = 200 * (x2 - x1**2)
return np.array([df_dx1, df_dx2])
# Hessian matrix calculation
def hessian(x):
x1, x2 = x[0], x[1]
d2f_dx1dx1 = -400 * (x2 - 3 * x1**2) + 2
d2f_dx1dx2 = -400 * x1
d2f_dx2dx1 = -400 * x1
d2f_dx2dx2 = 200
return np.array([[d2f_dx1dx1, d2f_dx1dx2], [d2f_dx2dx1, d2f_dx2dx2]])
# --- 2. Backtracking Line Search ---
def backtracking_line_search(x, p, grad, alpha_bar=1.0, rho=0.5, c1=1e-3):
"""
Finds a step size alpha that satisfies the 1st Wolfe condition (Armijo condition).
Condition: f(x + alpha*p) <= f(x) + c1 * alpha * grad^T * p
"""
alpha = alpha_bar
f_val = objective_function(x)
grad_dot_p = np.dot(grad, p)
# Loop until condition is met
while objective_function(x + alpha * p) > f_val + c1 * alpha * grad_dot_p:
alpha *= rho
# Safety break to prevent infinite loops if alpha becomes too small
if alpha < 1e-16:
break
return alpha
# --- 3. Optimization Algorithms ---
def run_optimization(method, x0, tol_ratio=1e-12, max_iter=20000):
"""
Runs the specified optimization method.
Returns: list of alphas used, total iterations
"""
x = x0.copy()
grad_0_norm = np.linalg.norm(gradient(x0))
alphas = []
print(f"[{method}] Starting from {x0}...")
for i in range(max_iter):
grad = gradient(x)
grad_norm = np.linalg.norm(grad)
# Convergence Check: ||grad f(xk)|| < 10^-12 * ||grad f(x0)||
if grad_norm < tol_ratio * grad_0_norm:
print(f" -> Converged at iteration {i}. Final Loss: {objective_function(x):.6e}")
return alphas, i
# Determine Search Direction
if method == "Steepest_Descent":
direction = -grad
elif method == "Newton":
hess = hessian(x)
try:
# Solve H * d = -g for d
direction = np.linalg.solve(hess, -grad)
except np.linalg.LinAlgError:
# Fallback if Hessian is singular
direction = -grad
# Perform Backtracking Line Search
alpha = backtracking_line_search(x, direction, grad, alpha_bar=1.0, rho=0.5, c1=1e-3)
# Update Position
x = x + alpha * direction
alphas.append(alpha)
print(f" -> Did not converge within {max_iter} iterations.")
print(f" -> Final Gradient Norm: {grad_norm:.6e}")
return alphas, max_iter
# --- 4. Main Execution and Plotting ---
# Configuration
initial_points = [np.array([1.2, 1.2]), np.array([-1.2, 1.0])]
methods = ["Steepest_Descent", "Newton"]
# Dictionary to hold simulation results
results = {}
# Run simulations
for x0 in initial_points:
for method in methods:
# Construct a unique key for storage
key = f"{method}_x0_{x0}"
alphas, num_iters = run_optimization(method, x0)
results[key] = {'alphas': alphas, 'iters': num_iters, 'x0': x0}
# Plot configuration
fig, axes = plt.subplots(2, 2, figsize=(14, 10))
plt.subplots_adjust(hspace=0.4, wspace=0.3)
# Mapping results to subplots
plot_mapping = {
("Steepest_Descent", str(initial_points[0])): (0, 0),
("Newton", str(initial_points[0])): (0, 1),
("Steepest_Descent", str(initial_points[1])): (1, 0),
("Newton", str(initial_points[1])): (1, 1),
}
for key, data in results.items():
method_name = key.split("_x0_")[0]
x0_str = str(data['x0'])
ax_idx = plot_mapping[(method_name, x0_str)]
ax = axes[ax_idx]
y_data = data['alphas']
x_data = range(len(y_data))
# --- PLOTTING LOGIC MODIFICATION ---
# For Steepest Descent, show only first {limit} steps
if method_name == "Steepest_Descent":
limit = 30
if len(y_data) > limit:
y_data = y_data[:limit]
x_data = range(limit)
title_suffix = f" (First {limit} Steps Shown)"
else:
title_suffix = ""
else:
title_suffix = ""
ax.plot(x_data, y_data, marker='o', linestyle='-', markersize=4, linewidth=1.5)
# Titles and Labels
ax.set_title(f"{method_name}\nStart: {data['x0']}\nTotal Iters: {data['iters']}{title_suffix}")
ax.set_xlabel("Iteration")
ax.set_ylabel("Step Size (Alpha)")
ax.grid(True, which='both', linestyle='--', alpha=0.7)
# Add annotation for total iterations
ax.text(0.95, 0.95, f"Total Iters: {data['iters']}",
transform=ax.transAxes,
verticalalignment='top', horizontalalignment='right',
bbox=dict(boxstyle='round', facecolor='white', alpha=0.8))
# Save and Show
#plt.suptitle("Step Size vs Iteration (Rosenbrock Function)", fontsize=16)
plt.savefig("optimization_results.png")
#plt.show()

Binary file not shown (new image, 142 KiB).

81
homework8/Homework8_Q5.py Normal file
View File

@@ -0,0 +1,81 @@
import numpy as np
import matplotlib.pyplot as plt
# --- FUNCTION DEFINITION CORRECTED HERE ---
def g(t):
"""
Calculates g(t) = t^4 - 3t^3 + 2t^2 in a vectorized way.
It handles both single float inputs and NumPy array inputs.
If an element's absolute value is too large, it returns infinity
to prevent overflow and handle plotting of diverging paths.
"""
# Use np.where for a vectorized if-else statement.
# This correctly handles both scalar and array inputs.
return np.where(np.abs(t) > 1e10, # Condition
np.inf, # Value if condition is True
t**4 - 3*t**3 + 2*t**2) # Value if condition is False
# Define the gradient (derivative) of g(t)
def grad_g(t):
# This function is only called with scalars in our loop,
# but it's good practice for it to be vectorization-safe as well.
# Standard arithmetic operations are already vectorized in NumPy.
return 4*t**3 - 9*t**2 + 4*t
# Implement the gradient descent algorithm
def gradient_descent(x0, alpha, iterations=100):
history = [x0]
x = x0
for _ in range(iterations):
grad = grad_g(x)
if np.isinf(x) or np.isnan(x) or np.abs(x) > 1e9:
print(f"Divergence detected for alpha = {alpha}. Stopping early.")
break
x = x - alpha * grad
history.append(x)
if not np.isinf(x) and not np.isnan(x) and np.abs(x) <= 1e9:
print(f"Alpha: {alpha:<.2f}, Current x: {x:<.2f}, g(x): {g(x):<.2f}")
return history
# --- Main part of the experiment ---
# Set an initial point
initial_xs = [-1.0, 0.5, 0.65, 2.5]
# Define a list of different alpha values to test
alphas_to_test = [0.05, 0.15, 0.25, 0.4, 0.5, 0.6]
# Run the experiment for each alpha value and plot the results
for initial_x in initial_xs:
print(f"Running gradient descent from initial x = {initial_x}")
# Create a plot
plt.figure(figsize=(14, 8))
# Plot the function g(t) for context
t_plot = np.linspace(-1.5, 3.5, 400)
plt.plot(t_plot, g(t_plot), 'k-', label='g(t) = t^4 - 3t^3 + 2t^2', linewidth=2)
for alpha in alphas_to_test:
history = gradient_descent(initial_x, alpha)
history_np = np.array(history)
plt.plot(history_np, g(history_np), 'o-', label=f'alpha = {alpha}', markersize=4, alpha=0.8)
# Add stationary points
minima1 = 0.0
minima2 = (9 + np.sqrt(17)) / 8
maxima = (9 - np.sqrt(17)) / 8
plt.plot(minima1, g(minima1), 'g*', markersize=15, label=f'Local Minimum at t={minima1:.2f}')
plt.plot(minima2, g(minima2), 'g*', markersize=15, label=f'Local Minimum at t≈{minima2:.2f}')
plt.plot(maxima, g(maxima), 'rX', markersize=10, label=f'Local Maximum at t≈{maxima:.2f}')
# Final plot formatting
plt.title('Gradient Descent Convergence for Different Step Sizes (alpha, initial x={})'.format(initial_x))
plt.xlabel('t')
plt.ylabel('g(t)')
plt.legend()
plt.grid(True)
plt.ylim(-1, 5)
plt.xlim(-1.5, 3.5)
plt.savefig(f'Homework8_Q5_Gradient_Descent_Convergence_x={initial_x}.png')

View File

@@ -0,0 +1,28 @@
Running gradient descent from initial x = -1.0
Alpha: 0.05, Current x: -0.00, g(x): 0.00
Alpha: 0.15, Current x: 1.64, g(x): -0.62
Divergence detected for alpha = 0.25. Stopping early.
Divergence detected for alpha = 0.4. Stopping early.
Divergence detected for alpha = 0.5. Stopping early.
Divergence detected for alpha = 0.6. Stopping early.
Running gradient descent from initial x = 0.5
Alpha: 0.05, Current x: 0.00, g(x): 0.00
Alpha: 0.15, Current x: 0.00, g(x): 0.00
Alpha: 0.25, Current x: 0.00, g(x): 0.00
Alpha: 0.40, Current x: -0.00, g(x): 0.00
Alpha: 0.50, Current x: 0.02, g(x): 0.00
Alpha: 0.60, Current x: 0.18, g(x): 0.05
Running gradient descent from initial x = 0.65
Alpha: 0.05, Current x: 1.64, g(x): -0.62
Alpha: 0.15, Current x: 1.64, g(x): -0.62
Alpha: 0.25, Current x: 1.64, g(x): -0.62
Alpha: 0.40, Current x: 1.51, g(x): -0.57
Alpha: 0.50, Current x: 0.01, g(x): 0.00
Divergence detected for alpha = 0.6. Stopping early.
Running gradient descent from initial x = 2.5
Alpha: 0.05, Current x: 1.64, g(x): -0.62
Alpha: 0.15, Current x: 0.00, g(x): 0.00
Divergence detected for alpha = 0.25. Stopping early.
Divergence detected for alpha = 0.4. Stopping early.
Divergence detected for alpha = 0.5. Stopping early.
Divergence detected for alpha = 0.6. Stopping early.

Binary file not shown (new image, 82 KiB).

Binary file not shown (new image, 66 KiB).

Binary file not shown (new image, 91 KiB).

Binary file not shown (new image, 82 KiB).

View File

@@ -16,15 +16,15 @@ As $\epsilon \rightarrow 0$, the normal equation method numerically unstable. A
Results:
| $\epsilon$ | Normal Equation Method `proj(A, b)` | SVD Method `proj_SVD(A, b)` | Difference (Normal Eq - SVD) |
|:---:|:---|:---|:---|
| **1.0** | `[1.85714286 1. 3.14285714 1.28571429 3.85714286]` | `[1.85714286 1. 3.14285714 1.28571429 3.85714286]` | `[ 1.78e-15 -2.22e-15 -8.88e-16 8.88e-16 0.00e+00]` |
| **0.1** | `[1.85714286 1. 3.14285714 1.28571429 3.85714286]` | `[1.85714286 1. 3.14285714 1.28571429 3.85714286]` | `[ 7.28e-14 -4.44e-16 -2.66e-14 -1.62e-14 -5.28e-14]` |
| **0.01** | `[1.85714286 1. 3.14285714 1.28571429 3.85714286]` | `[1.85714286 1. 3.14285714 1.28571429 3.85714286]` | `[-5.45e-12 -7.28e-12 -3.45e-13 -4.24e-12 -4.86e-12]` |
| **1e-4** | `[1.85714297 1.00000012 3.14285716 1.28571442 3.85714302]` | `[1.85714286 1. 3.14285714 1.28571429 3.85714286]` | `[1.11e-07 1.19e-07 1.92e-08 1.36e-07 1.67e-07]` |
| **1e-8** | **Error:** `LinAlgError: Singular matrix` | `[1.85714286 1. 3.14285714 1.28571428 3.85714286]` | `Could not compute difference due to previous error.` |
| **1e-16**| **Error:** `ValueError: Matrix A must be full rank` | `[1.81820151 1. 3.18179849 2.29149804 2.89030045]` | `Could not compute difference due to previous error.` |
| **1e-32**| **Error:** `ValueError: Matrix A must be full rank` | `[2. 1. 3. 2.5 2.5]` | `Could not compute difference due to previous error.` |
| **1.0** | `[1.85714286 1. 3.14285714 1.28571429 3.85714286]` | `[1.85714286 1. 3.14285714 1.28571429 3.85714286]` | `[ 2.22e-16 1.55e-15 -4.44e-16 2.22e-16 -8.88e-16]` |
| **0.1** | `[1.85714286 1. 3.14285714 1.28571429 3.85714286]` | `[1.85714286 1. 3.14285714 1.28571429 3.85714286]` | `[ 8.08e-14 5.87e-14 -8.88e-16 4.82e-14 -1.38e-14]` |
| **0.01** | `[1.85714286 1. 3.14285714 1.28571429 3.85714286]` | `[1.85714286 1. 3.14285714 1.28571429 3.85714286]` | `[-4.77e-12 -1.84e-14 5.54e-13 -4.00e-12 1.50e-12]` |
| **1e-4** | `[1.85714282 1. 3.14285716 1.28571427 3.85714291]` | `[1.85714286 1. 3.14285714 1.28571429 3.85714286]` | `[-3.60e-08 9.11e-13 1.94e-08 -1.20e-08 4.80e-08]` |
| **1e-8** | `[-1.87500007 0.99999993 -3.12499997 -2.62500007 3.49999996]` | `[1.85714286 1. 3.14285714 1.28571427 3.85714286]` | `[-3.73e+00 -7.45e-08 -6.27e+00 -3.91e+00 -3.57e-01]` |
| **1e-16**| **Error:** `ValueError: Matrix A must be full rank` | `[3.4 1. 1.6 1.8 1.8]` | `Could not compute difference due to previous error.` |
| **1e-32**| **Error:** `ValueError: Matrix A must be full rank` | `[3.4 1. 1.6 1.8 1.8]` | `Could not compute difference due to previous error.` |
Numerical experiments show that as $\epsilon$ becomes small, the difference between the two methods increases. When $\epsilon$ becomes very small (e.g., 1e-8), the normal equation method fails while the SVD method continues to provide a stable solution.
Numerical experiments show that as $\epsilon$ becomes small, the difference between the two methods grows. For very small $\epsilon$ (e.g., 1e-8) the normal equation method no longer returns a valid result, and it fails outright as $\epsilon$ decreases further (e.g., 1e-16), while the SVD method continues to provide a stable solution.
***

View File

@@ -4,8 +4,8 @@ Projection of b onto the column space of A(1): (Using proj function)
Projection of b onto the column space of A(1): (Using proj_SVD function)
[1.85714286 1. 3.14285714 1.28571429 3.85714286]
Difference between the two methods:
[ 1.77635684e-15 -2.22044605e-15 -8.88178420e-16 8.88178420e-16
0.00000000e+00]
[ 2.22044605e-16 1.55431223e-15 -4.44089210e-16 2.22044605e-16
-8.88178420e-16]
Question 1(b):
@@ -15,8 +15,8 @@ Projection of b onto the column space of A(1.0):
Projection of b onto the column space of A(1.0) using SVD:
[1.85714286 1. 3.14285714 1.28571429 3.85714286]
Difference between the two methods:
[ 1.77635684e-15 -2.22044605e-15 -8.88178420e-16 8.88178420e-16
0.00000000e+00]
[ 2.22044605e-16 1.55431223e-15 -4.44089210e-16 2.22044605e-16
-8.88178420e-16]
For ε = 0.1:
Projection of b onto the column space of A(0.1):
@@ -24,8 +24,8 @@ Projection of b onto the column space of A(0.1):
Projection of b onto the column space of A(0.1) using SVD:
[1.85714286 1. 3.14285714 1.28571429 3.85714286]
Difference between the two methods:
[ 7.28306304e-14 -4.44089210e-16 -2.66453526e-14 -1.62092562e-14
-5.28466160e-14]
[ 8.08242362e-14 5.87307980e-14 -8.88178420e-16 4.81836793e-14
-1.37667655e-14]
For ε = 0.01:
Projection of b onto the column space of A(0.01):
@@ -33,35 +33,37 @@ Projection of b onto the column space of A(0.01):
Projection of b onto the column space of A(0.01) using SVD:
[1.85714286 1. 3.14285714 1.28571429 3.85714286]
Difference between the two methods:
[-5.45297141e-12 -7.28239691e-12 -3.44613227e-13 -4.24371649e-12
-4.86499729e-12]
[-4.76907402e-12 -1.84297022e-14 5.53779245e-13 -4.00324218e-12
1.49613655e-12]
For ε = 0.0001:
Projection of b onto the column space of A(0.0001):
[1.85714297 1.00000012 3.14285716 1.28571442 3.85714302]
[1.85714282 1. 3.14285716 1.28571427 3.85714291]
Projection of b onto the column space of A(0.0001) using SVD:
[1.85714286 1. 3.14285714 1.28571429 3.85714286]
Difference between the two methods:
[1.11406275e-07 1.19209290e-07 1.91642426e-08 1.35516231e-07
1.67459071e-07]
[-3.59740875e-08 9.10937992e-13 1.94238092e-08 -1.19938544e-08
4.79721098e-08]
For ε = 1e-08:
LinAlgError for eps=1e-08: Singular matrix
Projection of b onto the column space of A(1e-08):
[-1.87500007 0.99999993 -3.12499997 -2.62500007 3.49999996]
Projection of b onto the column space of A(1e-08) using SVD:
[1.85714286 1. 3.14285714 1.28571428 3.85714286]
[1.85714286 1. 3.14285714 1.28571427 3.85714286]
Difference between the two methods:
Could not compute difference due to previous error.
[-3.73214294e+00 -7.45058057e-08 -6.26785711e+00 -3.91071435e+00
-3.57142909e-01]
For ε = 1e-16:
ValueError for eps=1e-16: Matrix A must be full rank.
Projection of b onto the column space of A(1e-16) using SVD:
[1.81820151 1. 3.18179849 2.29149804 2.89030045]
[3.4 1. 1.6 1.8 1.8]
Difference between the two methods:
Could not compute difference due to previous error.
For ε = 1e-32:
ValueError for eps=1e-32: Matrix A must be full rank.
Projection of b onto the column space of A(1e-32) using SVD:
[2. 1. 3. 2.5 2.5]
[3.4 1. 1.6 1.8 1.8]
Difference between the two methods:
Could not compute difference due to previous error.

Binary file not shown (image modified; 71 KiB before and after).

Binary file not shown (new image, 91 KiB).

Binary file not shown (image modified; 38 KiB before and after).

View File

@@ -38,9 +38,13 @@ def proj_SVD(A:np.ndarray, b:np.ndarray) -> np.ndarray:
= U S V^* (V S^2 V^*)^(-1) V S U^* b
= U S V^* V S^(-2) V^* V S U^* b
= U U^* b
If A = U S V^*, then the projection onto the column space of A is:
proj_A(b) = U_r U_r^* b
where U_r are the left singular vectors corresponding to nonzero singular values.
"""
U_r = U[:, :np.linalg.matrix_rank(A)] # Take only the relevant columns
# Compute the projection using the SVD components
projection = U @ U.conj().T @ b
projection = U_r @ U_r.conj().T @ b
return projection
def build_A(eps: float) -> np.ndarray:

View File

@@ -73,18 +73,18 @@ def f1(t: float) -> float:
"""
return 1.0 / (1.0 + t**2)
def build_A(N: int, n: int, f: callable) -> tuple[np.ndarray, np.ndarray]:
def build_A(N: int, n: int, f: callable, f_range: tuple) -> tuple[np.ndarray, np.ndarray]:
"""
Build the matrix A for the least squares problem.
Parameters:
n + 1 (int): The number of columns in the matrix A.
f_range (tuple): The range of the function f.
Returns:
np.ndarray: The constructed matrix A.
"""
"""
{t_j}j=0->N, t_0=-5, t_N=5, t_j divides [-5, 5] equally
{t_j}j=0->N, t_0=f_range[0], t_N=f_range[1], t_j divides [f_range[0], f_range[1]] equally
A = [[1, t_0, t_0^2, t_0^3, ..., t_0^n],
[1, t_1, t_1^2, t_1^3, ..., t_1^n],
...
@@ -95,7 +95,7 @@ def build_A(N: int, n: int, f: callable) -> tuple[np.ndarray, np.ndarray]:
Ax = b, x is the coeffs of the polynomial
"""
A = np.zeros((N + 1, n + 1), dtype=float)
t = np.linspace(-5, 5, N + 1)
t = np.linspace(f_range[0], f_range[1], N + 1)
for i in range(N + 1):
A[i, :] = [t[i]**j for j in range(n + 1)]
b = np.array([f(t_i) for t_i in t])
@@ -113,7 +113,7 @@ def question_3c():
N = Ns[i]
n = ns[i]
A = np.zeros((N + 1, n + 1), dtype=float)
A, b = build_A(N, n, f1)
A, b = build_A(N, n, f1, (-5, 5))
x = householder_lstsq(A, b)
p_t = sum([x[j] * t**j for j in range(n + 1)])
plt.subplot(1, 3, i + 1)
@@ -135,6 +135,32 @@ def f2(n:int, t: float) -> float:
"""
return sum([t**i for i in range(n + 1)])
def question_3d():
Ns = [25, 50, 100]
ns = Ns
t = np.linspace(-5, 5, 1000)
f_t = f1(t)
plt.figure(figsize=(15, 10))
for i in range(len(Ns)):
N = Ns[i]
n = ns[i]
A = np.zeros((N + 1, n + 1), dtype=float)
A, b = build_A(N, n, f1, (-5, 5))
x = householder_lstsq(A, b)
p_t = sum([x[j] * t**j for j in range(n + 1)])
plt.subplot(1, 3, i + 1)
plt.plot(t, f_t, label='f(t)', color='blue')
plt.plot(t, p_t, label='p(t)', color='red', linestyle='--')
plt.title(f'N={N}, n={n}')
plt.xlabel('t')
plt.ylabel('y')
plt.legend()
plt.grid(True, alpha=0.3)
plt.suptitle('Least Squares Polynomial Approximation using Householder QR')
plt.tight_layout(rect=[0, 0.03, 1, 0.95])
plt.savefig('Project1_A3d_least_squares_approximation.png')
#plt.show()
def question_3e():
# n = 4, 6, 8, 10, ..., 20
ns = list(range(4, 21, 2))
@@ -143,7 +169,7 @@ def question_3e():
losses = []
for n in ns:
N = 2 * n
A, b = build_A(N, n, lambda t: f2(n, t))
A, b = build_A(N, n, lambda t: f2(n, t), (0, 1))
x = householder_lstsq(A, b)
true_coeffs = np.array([1.0 for _ in range(n + 1)])
loss = np.linalg.norm(x - true_coeffs)
@@ -161,6 +187,7 @@ def question_3e():
if __name__ == "__main__":
question_3c()
question_3d()
question_3e()

View File

@@ -6,7 +6,7 @@ conda activate math6601_env
pip install -r requirements.txt
```
### Question 1
### Run programs
```bash
python Project1_Q1.py > Project1_A1.txt

162
project1/main.tex Normal file
View File

@@ -0,0 +1,162 @@
\documentclass{article}
% Language setting
\usepackage[english]{babel}
% Set page size and margins
\usepackage[letterpaper,top=2cm,bottom=2cm,left=3cm,right=3cm,marginparwidth=1.75cm]{geometry}
% Useful packages
\usepackage{amsmath}
\usepackage{graphicx}
\usepackage{amsfonts}
\usepackage[colorlinks=true, allcolors=blue]{hyperref}
\usepackage{array} % For better table column definitions
\title{MATH 6601 - Project 1 Report}
\author{Zhe Yuan (yuan.1435)}
\date{Sep 2025}
\begin{document}
\maketitle
\section{Projections}
\subsection*{(a)}
The projection of vector $b$ onto the column space of a full-rank matrix $A$ is given by $p=A(A^*A)^{-1}A^*b$. A function \texttt{proj(A, b)} was implemented based on this formula (see \texttt{Project1\_Q1.py}). For $\epsilon = 1$, the projection is:
\begin{verbatim}
p = [1.85714286, 1.0, 3.14285714, 1.28571429, 3.85714286]
\end{verbatim}
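For reference, a minimal NumPy sketch of this formula (a simplified stand-in for the actual \texttt{proj} routine in \texttt{Project1\_Q1.py}):
\begin{verbatim}
import numpy as np

def proj_normal_eq(A, b):
    # p = A (A^* A)^{-1} A^* b, assuming A has full column rank
    AtA = A.conj().T @ A
    return A @ np.linalg.solve(AtA, A.conj().T @ b)
\end{verbatim}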
\subsection*{(b)}
As $\epsilon \rightarrow 0$, the normal equation method becomes numerically unstable. A more robust SVD-based method, \texttt{proj\_SVD(A, b)}, was implemented to handle this (see \texttt{Project1\_Q1.py}). The results are summarized in Table~\ref{tab:proj_results}.
\begin{table}[h!]
\centering
\small % Use a smaller font for the table
\begin{tabular}{|c|>{\ttfamily}p{3cm}|>{\ttfamily}p{3cm}|p{3.5cm}|}
\hline
\textbf{$\epsilon$} & \textbf{Normal Equation Method \texttt{proj(A,b)}} & \textbf{SVD Method \texttt{proj\_SVD(A,b)}} & \textbf{Difference (Normal Eq - SVD)} \\
\hline
\textbf{1.0} & [1.85714286 1. 3.14285714 1.28571429 3.85714286] & [1.85714286 1. 3.14285714 1.28571429 3.85714286] & [ 2.22e-16 1.55e-15 -4.44e-16 2.22e-16 -8.88e-16] \\
\hline
\textbf{0.1} & [1.85714286 1. 3.14285714 1.28571429 3.85714286] & [1.85714286 1. 3.14285714 1.28571429 3.85714286] & [ 8.08e-14 5.87e-14 -8.88e-16 4.82e-14 -1.38e-14] \\
\hline
\textbf{0.01} & [1.85714286 1. 3.14285714 1.28571429 3.85714286] & [1.85714286 1. 3.14285714 1.28571429 3.85714286] & [-4.77e-12 -1.84e-14 5.54e-13 -4.00e-12 1.50e-12] \\
\hline
\textbf{1e-4} & [1.85714282 1. 3.14285716 1.28571427 3.85714291] & [1.85714286 1. 3.14285714 1.28571429 3.85714286] & [-3.60e-08 9.11e-13 1.94e-08 -1.20e-08 4.80e-08] \\
\hline
\textbf{1e-8} & [-1.87500007 0.99999993 -3.12499997 -2.62500007 3.49999996] & [1.85714286 1. 3.14285714 1.28571427 3.85714286] & [-3.73e+00 -7.45e-08 -6.27e+00 -3.91e+00 -3.57e-01] \\
\hline
\textbf{1e-16} & \textbf{Error:} \texttt{ValueError: Matrix A must be full rank} & [3.4 1. 1.6 1.8 1.8] & Could not compute difference due to previous error. \\
\hline
\textbf{1e-32} & \textbf{Error:} \texttt{ValueError: Matrix A must be full rank} & [3.4 1. 1.6 1.8 1.8] & Could not compute difference due to previous error. \\
\hline
\end{tabular}
\caption{Comparison of results from the normal equation and SVD-based methods.}
\label{tab:proj_results}
\end{table}
\noindent Numerical experiments show that as $\epsilon$ becomes small, the difference between the two methods grows. For very small $\epsilon$ (e.g., $10^{-8}$) the normal equation method no longer returns a valid result, and it fails outright as $\epsilon$ decreases further (e.g., $10^{-16}$), while the SVD method continues to provide a stable solution.
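This behavior is expected: forming the normal equations squares the conditioning of the problem, since for a full-column-rank $A$
\[
\kappa_2(A^*A) = \kappa_2(A)^2 ,
\]
so roughly twice as many significant digits are lost as $\epsilon \rightarrow 0$, whereas the SVD-based projection $U_r U_r^* b$ avoids forming $A^*A$ and remains stable.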
\section{QR Factorisation}
\subsection*{(a, b, c)}
Four QR factorization algorithms were implemented to find an orthonormal basis $Q$ for the column space of the $n \times n$ Hilbert matrix (for $n=2$ to $20$):
\begin{enumerate}
\item Classical Gram-Schmidt (CGS, \texttt{cgs\_q})
\item Modified Gram-Schmidt (MGS, \texttt{mgs\_q})
\item Householder QR (\texttt{householder\_q})
\item Classical Gram-Schmidt Twice (CGS-Twice, \texttt{cgs\_twice\_q})
\end{enumerate}
For implementation details, please see the \texttt{Project1\_Q2.py} file.
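To illustrate the flavor of these routines, the following is a minimal classical Gram-Schmidt sketch together with the orthogonality-loss measure used in part (d); it is a simplified stand-in, not the exact code in \texttt{Project1\_Q2.py}:
\begin{verbatim}
import numpy as np

def cgs_q(A):
    # Classical Gram-Schmidt: orthonormalize the columns of A
    m, n = A.shape
    Q = np.zeros((m, n))
    for j in range(n):
        v = A[:, j].copy()
        for i in range(j):
            # projections use the *original* column a_j (classical variant)
            v -= (Q[:, i] @ A[:, j]) * Q[:, i]
        Q[:, j] = v / np.linalg.norm(v)
    return Q

def ortho_loss(Q):
    # log10 of the Frobenius-norm departure from orthonormality
    n = Q.shape[1]
    return np.log10(np.linalg.norm(np.eye(n) - Q.T @ Q, 'fro'))
\end{verbatim}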
\subsection*{(d)}
The quality of the computed $Q$ from each method was assessed by plotting the orthogonality loss, $\log_{10}(\|I - Q^T Q\|_F)$, versus the matrix size $n$, as shown in Figure~\ref{fig:ortho_loss}.
\begin{figure}[h!]
\centering
\includegraphics[width=0.8\textwidth]{Project1_A2d_orthogonality_loss.png}
\caption{Orthogonality Loss vs. Matrix Size for QR Methods.}
\label{fig:ortho_loss}
\end{figure}
A summary of the loss and computation time for $n = 4, 9, 11$ is provided in Table~\ref{tab:qr_results}.
\begin{table}[h!]
\centering
\begin{tabular}{|c|l|r|r|}
\hline
\textbf{n} & \textbf{Method} & \textbf{Loss ($log_{10}$)} & \textbf{Time (s)} \\
\hline
4 & Classical Gram-Schmidt & -10.311054 & 4.28e-05 \\
4 & Modified Gram-Schmidt & -12.374458 & 5.89e-05 \\
4 & Householder & -15.351739 & 1.42e-04 \\
4 & Classical Gram-Schmidt Twice & -15.570756 & 8.99e-05 \\
\hline
9 & Classical Gram-Schmidt & 0.389425 & 2.89e-04 \\
9 & Modified Gram-Schmidt & -5.257679 & 3.50e-04 \\
9 & Householder & -14.715202 & 6.19e-04 \\
9 & Classical Gram-Schmidt Twice & -8.398044 & 6.07e-04 \\
\hline
11 & Classical Gram-Schmidt & 0.609491 & 5.23e-04 \\
11 & Modified Gram-Schmidt & -2.005950 & 5.77e-04 \\
11 & Householder & -14.697055 & 8.68e-04 \\
11 & Classical Gram-Schmidt Twice & -1.745087 & 1.07e-03 \\
\hline
\end{tabular}
\caption{Loss and computation time for selected matrix sizes.}
\label{tab:qr_results}
\end{table}
\subsection*{(e)}
The speed and accuracy of the four methods were compared based on the plots in Figure~\ref{fig:ortho_loss} and Figure~\ref{fig:time_taken}.
\begin{figure}[h!]
\centering
\includegraphics[width=0.8\textwidth]{Project1_A2d_time_taken.png}
\caption{Computation Time vs. Matrix Size for QR Methods.}
\label{fig:time_taken}
\end{figure}
\begin{itemize}
\item \textbf{Accuracy:} Householder is the most accurate and stable. MGS is significantly better than CGS. CGS-Twice improves on CGS, achieving accuracy comparable to MGS. CGS is highly unstable and loses orthogonality quickly.
\item \textbf{Speed:} CGS and MGS are the fastest. Householder is slightly slower, and CGS-Twice is the slowest.
\end{itemize}
\section{Least Square Problem}
\subsection*{(a)}
The problem is formulated as $Ax = b$, where $A$ is an $(N+1) \times (n+1)$ Vandermonde matrix, $x$ is the $(n+1) \times 1$ vector of unknown polynomial coefficients $[a_0, \dots, a_n]^T$, and $b$ is the $(N+1) \times 1$ vector of known function values $f(t_j)$.
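A minimal sketch of this setup (a hypothetical helper for illustration, not the exact code in \texttt{Project1\_Q3.py}):
\begin{verbatim}
import numpy as np

def build_system(f, N, n, a=-5.0, b=5.0):
    # (N+1) equally spaced nodes t_j and the (N+1) x (n+1) Vandermonde matrix
    t = np.linspace(a, b, N + 1)
    A = np.vander(t, n + 1, increasing=True)   # columns: 1, t, t^2, ..., t^n
    rhs = f(t)                                 # entries f(t_j)
    return A, rhs
\end{verbatim}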
\subsection*{(b)}
The least squares problem was solved using the implemented Householder QR factorization (\texttt{householder\_lstsq} in \texttt{Project1\_Q3.py}, the same routine as in Question 2) to find the coefficient vector $x$.
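The same solve can be sketched with NumPy's built-in reduced QR standing in for the project's Householder routine:
\begin{verbatim}
import numpy as np

t = np.linspace(-5.0, 5.0, 31)       # N = 30, so N + 1 = 31 nodes
A = np.vander(t, 6, increasing=True) # degree n = 5
rhs = 1.0 / (1.0 + t**2)
Q, R = np.linalg.qr(A)               # reduced QR factorization
x = np.linalg.solve(R, Q.T @ rhs)    # R x = Q^T b gives the coefficients
\end{verbatim}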
\subsection*{(c)}
The function $f(t) = 1 / (1 + t^2)$ and its polynomial approximation $p(t)$ were plotted for $N=30$ and $n=5, 15, 30$, as shown in Figure~\ref{fig:ls_approx}.
\begin{figure}[h!]
\centering
\includegraphics[width=0.8\textwidth]{Project1_A3c_least_squares_approximation.png}
\caption{Least squares approximation of $f(t)=1/(1+t^2)$ for varying polynomial degrees $n$.}
\label{fig:ls_approx}
\end{figure}
When $n=15$, the approximation is excellent. When $n=30$, the polynomial interpolates the points but exhibits wild oscillations between them.
\subsection*{(d)}
No, $p(t)$ will not converge to $f(t)$ if $N = n$ tends to infinity. Polynomial interpolation on equally spaced nodes diverges for this function, as demonstrated by the severe oscillations in the $n=30$ case shown in Figure~\ref{fig:ls_approx}.
\subsection*{(e)}
The error between the computed and true coefficients was plotted against the polynomial degree $n$, as shown in Figure~\ref{fig:coeff_error}.
\begin{figure}[h!]
\centering
\includegraphics[width=0.8\textwidth]{Project1_A3e_coefficient_error.png}
\caption{Error in computed polynomial coefficients vs. polynomial degree $n$.}
\label{fig:coeff_error}
\end{figure}
The error in the computed coefficients grows significantly as $n$ increases.
\end{document}

BIN
project1/project-1.pdf Normal file

Binary file not shown.

View File

@@ -0,0 +1,154 @@
import numpy as np
from typing import Callable, Any, List, Tuple
# Tolerance and maximum iterations
TOL = 1e-10
MAX_ITER = 20000
def stationary_method(
b: np.ndarray,
method: str,
get_diag_inv: Callable[[int, Any], float],
get_off_diag_sum: Callable[[np.ndarray, int, Any], float],
mat_vec_prod: Callable[[np.ndarray, Any], np.ndarray],
omega: float = 1.0,
**kwargs
) -> Tuple[np.ndarray, int, List[float]]:
"""
Solves Ax=b using stationary methods (Jacobi, Gauss-Seidel, SOR).
"""
n = len(b)
x = np.zeros(n)
r0 = b.copy()
r0_norm = np.linalg.norm(r0)
if r0_norm == 0:
return x, 0, [0.0]
residual_history = []
for k in range(MAX_ITER):
# 1. Calculate current residual and its norm
r = b - mat_vec_prod(x, **kwargs)
res_norm = np.linalg.norm(r)
# 2. Append to history
residual_history.append(res_norm)
# 3. Check for convergence
if res_norm / r0_norm < TOL:
return x, k, residual_history
# 4. If not converged, perform the next iteration update
if method == 'jacobi':
x_old = x.copy()
for i in range(n):
off_diag_val = get_off_diag_sum(x_old, i, **kwargs)
diag_inv_val = get_diag_inv(i, **kwargs)
x[i] = diag_inv_val * (b[i] - off_diag_val)
else: # Gauss-Seidel and SOR
x_k_iter = x.copy() # Needed for SOR
for i in range(n):
off_diag_val = get_off_diag_sum(x, i, **kwargs)
diag_inv_val = get_diag_inv(i, **kwargs)
x_gs = diag_inv_val * (b[i] - off_diag_val)
if method == 'gauss_seidel':
x[i] = x_gs
elif method == 'sor':
x[i] = (1 - omega) * x_k_iter[i] + omega * x_gs
# If loop finishes (MAX_ITER reached), calculate and append final residual
r_final = b - mat_vec_prod(x, **kwargs)
residual_history.append(np.linalg.norm(r_final))
return x, MAX_ITER, residual_history
def steepest_descent(
mat_vec_prod: Callable[[np.ndarray, Any], np.ndarray],
b: np.ndarray,
**kwargs
) -> Tuple[np.ndarray, int, List[float]]:
"""
Solves Ax=b using Steepest Descent, with corrected residual logging.
"""
x = np.zeros_like(b)
r = b.copy()
r0_norm = np.linalg.norm(r)
if r0_norm == 0:
return x, 0, [0.0]
residual_history = []
for k in range(MAX_ITER):
# 1. Current residual norm is from previous step (or initial)
res_norm = np.linalg.norm(r)
# 2. Append to history
residual_history.append(res_norm)
# 3. Check for convergence BEFORE the update
if res_norm / r0_norm < TOL:
return x, k, residual_history
# 4. If not converged, compute update
Ar = mat_vec_prod(r, **kwargs)
r_dot_Ar = np.dot(r, Ar)
if r_dot_Ar == 0: # Should not happen for SPD if r!=0
break
alpha = res_norm**2 / r_dot_Ar
x += alpha * r
r -= alpha * Ar
# If loop finishes, append final residual
residual_history.append(np.linalg.norm(r))
return x, MAX_ITER, residual_history
def conjugate_gradient(
mat_vec_prod: Callable[[np.ndarray, Any], np.ndarray],
b: np.ndarray,
**kwargs
) -> Tuple[np.ndarray, int, List[float]]:
"""
Solves Ax=b using Conjugate Gradient, with corrected residual logging.
"""
x = np.zeros_like(b)
r = b.copy()
p = r.copy()
r0_norm = np.linalg.norm(r)
if r0_norm == 0:
return x, 0, [0.0]
res_norm_old = r0_norm
residual_history = []
for k in range(MAX_ITER):
# 1. Current residual norm is from previous step
# 2. Append to history
residual_history.append(res_norm_old)
# 3. Check for convergence
if res_norm_old / r0_norm < TOL:
return x, k, residual_history
# 4. If not converged, compute update
Ap = mat_vec_prod(p, **kwargs)
p_dot_Ap = np.dot(p, Ap)
if p_dot_Ap == 0:
break
alpha = res_norm_old**2 / p_dot_Ap
x += alpha * p
r -= alpha * Ap
res_norm_new = np.linalg.norm(r)
beta = res_norm_new**2 / res_norm_old**2
p = r + beta * p
res_norm_old = res_norm_new
# If loop finishes, append final residual
residual_history.append(res_norm_old)
return x, MAX_ITER, residual_history

187
project2/main.tex Normal file
View File

@@ -0,0 +1,187 @@
\documentclass{article}
% Language setting
\usepackage[english]{babel}
% Set page size and margins
\usepackage[letterpaper,top=2cm,bottom=2cm,left=3cm,right=3cm,marginparwidth=1.75cm]{geometry}
% Useful packages
\usepackage{amsmath}
\usepackage{graphicx}
\usepackage{amsfonts}
\usepackage{float} % For better table and figure placement
\usepackage[colorlinks=true, allcolors=blue]{hyperref}
\usepackage{array} % For better table column definitions
\title{MATH 6601 - Project 2 Report}
\author{Zhe Yuan (yuan.1435)}
\date{Nov 2025}
\begin{document}
\maketitle
\section*{Common Iterative Methods for Both Problems}
This project implements five iterative methods to solve large, sparse, symmetric positive-definite (SPD) linear systems of the form $Ax=b$. The implemented methods are:
\begin{itemize}
\item Jacobi method
\item Gauss-Seidel method
\item Successive Over-Relaxation (SOR) method
\item Steepest Descent method
\item Conjugate Gradient method
\end{itemize}
All five methods are implemented in Python. The core logic for each solver is contained in \texttt{iterative\_solvers.py}; the specific problems are set up and solved in \texttt{problem1.py} and \texttt{problem2.py}, respectively.
The initial guess was $x^{(0)}=0$, and the stopping condition was $\|r^{(k)}\|_2 / \|r^{(0)}\|_2 < 10^{-10}$. The matrix $A$ was never formed explicitly; the solvers access it only through callbacks (matrix-vector products and per-row diagonal/off-diagonal evaluations).
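For reference, the componentwise updates implemented in \texttt{iterative\_solvers.py} for the three stationary methods are
\begin{align*}
\text{Jacobi:} \quad & x_i^{(k+1)} = \frac{1}{a_{ii}}\Big(b_i - \sum_{j \neq i} a_{ij} x_j^{(k)}\Big), \\
\text{Gauss-Seidel:} \quad & x_i^{(k+1)} = \frac{1}{a_{ii}}\Big(b_i - \sum_{j<i} a_{ij} x_j^{(k+1)} - \sum_{j>i} a_{ij} x_j^{(k)}\Big), \\
\text{SOR:} \quad & x_i^{(k+1)} = (1-\omega)\, x_i^{(k)} + \omega\, x_i^{\mathrm{GS}},
\end{align*}
where $x_i^{\mathrm{GS}}$ denotes the Gauss-Seidel update; Steepest Descent and Conjugate Gradient use the standard residual-based updates for SPD systems.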
\section{Problem 1: Ordinary Differential Equations}
This problem solves the boundary value problem $-u'' = t$ on $(0,1)$ with $u(0)=u(1)=0$. To solve the problem numerically, the interval $(0,1)$ is discretized into $n+1$ subintervals of width $h=1/(n+1)$. The second derivative $u''(t_i)$ is approximated using a central difference scheme:
\[ u''(t_i) = -t_i \approx \frac{u(t_{i-1}) - 2u(t_i) + u(t_{i+1})}{h^2} \quad \implies \quad -u_{i-1} + 2u_i - u_{i+1} = h^2 t_i \]
for the internal grid points $i=1, \dots, n$. Combined with the boundary conditions $u_0=0$ and $u_{n+1}=0$, this forms a linear system $Au=b$, where $u = [u_1, \dots, u_n]^T$. The matrix $A \in \mathbb{R}^{n \times n}$ is a tridiagonal matrix, and the vector $b \in \mathbb{R}^n$ is given by:
\[
A = \begin{pmatrix}
2 & -1 & & & \\
-1 & 2 & -1 & & \\
& \ddots & \ddots & \ddots & \\
& & -1 & 2 & -1 \\
& & & -1 & 2
\end{pmatrix}, \quad
b = h^2 \begin{pmatrix} t_1 \\ t_2 \\ \vdots \\ t_n \end{pmatrix}
\]
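For example, with $n=3$ (so $h=1/4$ and $t_i = i/4$), the system is
\[
\begin{pmatrix} 2 & -1 & 0 \\ -1 & 2 & -1 \\ 0 & -1 & 2 \end{pmatrix}
\begin{pmatrix} u_1 \\ u_2 \\ u_3 \end{pmatrix}
= \frac{1}{16}\begin{pmatrix} 1/4 \\ 1/2 \\ 3/4 \end{pmatrix}
= \begin{pmatrix} 1/64 \\ 1/32 \\ 3/64 \end{pmatrix}.
\]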
\subsection*{(a) Exact Solution}
The boundary value problem is given by $-u'' = t$ on the interval $(0, 1)$ with boundary conditions $u(0) = u(1) = 0$.
Integrating twice gives the general solution:
\[ u(t) = -\frac{t^3}{6} - C_1 t - C_2 \]
Applying the boundary conditions $u(0)=0$ and $u(1)=0$, we find the constants $C_2=0$ and $C_1 = -1/6$. Thus, the exact solution is:
\[ u(t) = \frac{t - t^3}{6} \]
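As a quick symbolic sanity check of this solution (a small sketch assuming SymPy is available; it is not part of the project code):
\begin{verbatim}
import sympy as sp

t = sp.symbols('t')
u = (t - t**3) / 6
assert sp.simplify(-sp.diff(u, t, 2) - t) == 0   # -u'' = t
assert u.subs(t, 0) == 0 and u.subs(t, 1) == 0   # u(0) = u(1) = 0
\end{verbatim}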
The plot of this exact solution is shown in Figure~\ref{fig:p1_exact_solution}.
\begin{figure}[H]
\centering
\includegraphics[width=0.8\textwidth]{problem1_exact_solution.png}
\caption{Plot of the exact solution $u(t) = (t-t^3)/6$.}
\label{fig:p1_exact_solution}
\end{figure}
\subsection*{(b, c) Iteration Solution}
As required in 1(b), the linear system was solved for $n=20$ and $n=40$. For SOR, the optimal relaxation parameter $\omega = \frac{2}{1+\sin(\pi h)}$ was used. The number of iterations required for each method to converge is summarized in Table~\ref{tab:p1_iterations}.
\begin{table}[H]
\centering
\begin{tabular}{|l|r|r|}
\hline
\textbf{Method} & \textbf{Iterations (n=20)} & \textbf{Iterations (n=40)} \\
\hline
Jacobi & 2031 & 7758 \\
Gauss-Seidel & 1018 & 3882 \\
SOR & 94 & 183 \\
Steepest Descent & 2044 & 7842\\
Conjugate Gradient & 20 & 40 \\
\hline
\end{tabular}
\caption{Number of iterations for each method for Problem 1.}
\label{tab:p1_iterations}
\end{table}
\noindent \textbf{Observations:}
\begin{enumerate}
\item The Conjugate Gradient method is the most efficient, requiring the fewest iterations. SOR is the second-best with a significant speedup over Gauss-Seidel. Gauss-Seidel converges about twice as fast as Jacobi. The Steepest Descent method performs poorly, rivaling Jacobi in its slow convergence.
\item As $n$ doubles, the number of iterations increases for all methods. The iteration count for Jacobi, Gauss-Seidel, and Steepest Descent increases by a factor of roughly 4, while for SOR and CG the increase is closer to a factor of 2; see the note following this list.
\end{enumerate}
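This scaling is consistent with the standard convergence theory for the 1D model problem (a known result, quoted here for context rather than derived in the project): with $h = 1/(n+1)$, the Jacobi iteration matrix for this tridiagonal $A$ has spectral radius $\cos(\pi h) \approx 1 - \tfrac{1}{2}\pi^2 h^2$ and Gauss-Seidel's is its square, and Steepest Descent needs $O(\kappa_2(A)) = O(h^{-2})$ iterations, so all three grow like $O(n^2)$, matching the factor-of-4 increase. Optimal SOR has spectral radius $\approx 1 - 2\pi h$ and CG needs $O(\sqrt{\kappa_2(A)}) = O(h^{-1})$ iterations, which explains the factor-of-2 increase.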
\subsection*{(d) Convergence History}
The convergence history is shown in Figures~\ref{fig:p1_conv_n20} and \ref{fig:p1_conv_n40}. The stationary methods and SD show linear convergence, while CG shows superlinear convergence.
\begin{figure}[H]
\centering
\includegraphics[width=0.8\textwidth]{problem1_convergence_n20.png}
\caption{Convergence history for Problem 1 with n=20.}
\label{fig:p1_conv_n20}
\end{figure}
\begin{figure}[H]
\centering
\includegraphics[width=0.8\textwidth]{problem1_convergence_n40.png}
\caption{Convergence history for Problem 1 with n=40.}
\label{fig:p1_conv_n40}
\end{figure}
\newpage
\section{Problem 2: Partial Differential Equation}
This problem involves solving the PDE $-\nabla^2 u + u = 1$ on the unit square $[0,1]^2$ with zero boundary conditions. (The problem statement writes $-\nabla u + u = 1$, but since $\nabla u$ is a vector and $u$ is a scalar, the intended operator is the Laplacian, i.e., $-\nabla^2 u + u = 1$.) To solve the problem numerically, a finite difference approximation on an $n \times n$ grid of interior points leads to the discrete equations:
\[ (4+h^2)u_{i,j} - u_{i-1,j} - u_{i,j-1} - u_{i+1,j} - u_{i,j+1} = h^2, \quad i,j=1,\dots,n \]
To formulate this as a standard matrix system $Ax=b$, we reshape the 2D array of unknowns $u_{i,j}$ into a single 1D vector $x$ of length $N=n^2$. After flattening, $u_{i,j}$ maps to the index $k = (i-1)n + j$ in the vector $x$, the matrix $A \in \mathbb{R}^{N \times N}$ becomes a large, sparse, block tridiagonal matrix:
\[
A = \begin{pmatrix}
T & -I & & & \\
-I & T & -I & & \\
& \ddots & \ddots & \ddots & \\
& & -I & T & -I \\
& & & -I & T
\end{pmatrix}_{n^2 \times n^2}
\]
where $I$ is the $n \times n$ identity matrix, and $T$ is an $n \times n$ tridiagonal matrix given by:
\[
T = \begin{pmatrix}
4+h^2 & -1 & & & \\
-1 & 4+h^2 & -1 & & \\
& \ddots & \ddots & \ddots & \\
& & -1 & 4+h^2 & -1 \\
& & & -1 & 4+h^2
\end{pmatrix}_{n \times n}
\]
The right-hand side vector $b \in \mathbb{R}^{N}$ is a constant vector in which every element is $h^2$. With this block structure, row $k=(i-1)n+j$ of $Ax$ reproduces the stencil entry by entry:
\[
(T)_{j,j}\,x_{(i-1)n+j} = (4+h^2)\,u_{i,j}, \qquad (-I)_{j,j}\,x_{(i-2)n+j} = -u_{i-1,j}, \qquad (T)_{j,j-1}\,x_{(i-1)n+j-1} = -u_{i,j-1}, \quad \dots
\]
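A minimal NumPy check of this flattening convention (using 0-based indices $i, j = 0, \dots, n-1$, so that $u_{i,j}$ lands at position $k = i\,n + j$; the formula above uses the corresponding 1-based indexing):
\begin{verbatim}
import numpy as np

n = 3
u = np.arange(1, n * n + 1).reshape(n, n)   # u[i, j] on the n x n interior grid
x = u.flatten()                             # row-major flattening: k = i*n + j
i, j = 1, 2
assert x[i * n + j] == u[i, j]
\end{verbatim}
This is the same \texttt{reshape}/\texttt{flatten} convention used in \texttt{problem2.py}.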
\subsection*{(a) Iterative Solution}
The system was solved for $n=16$ ($N=256$) and $n=32$ ($N=1024$) using the same five iterative methods. The number of iterations to reach convergence is reported in Table~\ref{tab:p2_iterations}.
\begin{table}[H]
\centering
\begin{tabular}{|l|r|r|}
\hline
\textbf{Method} & \textbf{Iterations (n=16)} & \textbf{Iterations (n=32)} \\
\hline
Jacobi & 1268 & 4792 \\
Gauss-Seidel & 635 & 2397 \\
SOR & 71 & 138 \\
Steepest Descent & 1247 & 4807 \\
Conjugate Gradient & 31 & 66 \\
\hline
\end{tabular}
\caption{Number of iterations for each method for Problem 2.}
\label{tab:p2_iterations}
\end{table}
\noindent \textbf{Observations:}
The relative performance of the methods remains consistent with Problem 1: CG is the fastest, followed by SOR, Gauss-Seidel, Jacobi, and Steepest Descent. Doubling $n$ from 16 to 32 quadruples the number of unknowns. Again, the iteration counts for slower methods increase by a factor of approximately 4, while for CG and SOR, the increase is only about a factor of 2. This reinforces the conclusion that CG and SOR scale much better with problem size.
\subsection*{(b) Convergence History}
The convergence history plots are shown in Figures~\ref{fig:p2_conv_n16} and \ref{fig:p2_conv_n32}.
\begin{figure}[H]
\centering
\includegraphics[width=0.8\textwidth]{problem2_convergence_n16.png}
\caption{Convergence history for Problem 2 with n=16.}
\label{fig:p2_conv_n16}
\end{figure}
\begin{figure}[H]
\centering
\includegraphics[width=0.8\textwidth]{problem2_convergence_n32.png}
\caption{Convergence history for Problem 2 with n=32.}
\label{fig:p2_conv_n32}
\end{figure}
\subsection*{(c) Advantages of Iterative Methods}
For large, sparse linear systems arising from PDE discretizations, iterative methods offer significant advantages over direct methods:
\begin{enumerate}
\item Iterative methods typically require storing only a few vectors of size $N$, for a memory cost of $O(N)$. In contrast, direct methods must store factor matrices (such as $Q$ and $R$, or $L$ and $U$), which suffer fill-in and are generally much denser than the sparse $A$.
\item The cost per iteration for these problems is dominated by the sparse matrix-vector product, which is $O(N)$. If a method converges in $K$ iterations, the total cost is $O(KN)$, and for a good method such as CG, $K$ is much smaller than $N$. Direct sparse solvers generally have a higher asymptotic cost, so for very large $N$ iterative methods can be much faster.
\item Implementing iterative methods is often simpler than implementing a direct solver for sparse matrices.
\end{enumerate}
\end{document}

160
project2/problem1.py Normal file
View File

@@ -0,0 +1,160 @@
import numpy as np
import matplotlib.pyplot as plt
from iterative_solvers import *
# (a): Exact Solution
def exact_solution(t: np.ndarray) -> np.ndarray:
"""Computes the exact solution u(t) = t/6 * (1 - t^2)."""
return t / 6.0 * (1 - t**2)
def plot_exact_solution():
"""Plots the exact solution of the BVP."""
t_fine = np.linspace(0, 1, 500)
u_exact_fine = exact_solution(t_fine)
plt.figure(figsize=(10, 6))
plt.plot(t_fine, u_exact_fine, 'k-', label=r'Exact Solution $u(t) = t/6 \cdot (1 - t^2)$')
plt.title('Exact Solution of $-u\'\'=t$ with $u(0)=u(1)=0$')
plt.xlabel('$t$')
plt.ylabel('$u(t)$')
plt.grid(True)
plt.legend()
plt.savefig('problem1_exact_solution.png')
# plt.show()
print("Exact solution plot saved to 'problem1_exact_solution.png'")
# (b): Helper functions for iterative methods
def mat_vec_prod_p1(x: np.ndarray, n: int) -> np.ndarray:
"""Computes the matrix-vector product Ax for Problem 1."""
y = np.zeros(n)
# A is tridiagonal with [ -1, 2, -1 ]
# y_i = -x_{i-1} + 2x_i - x_{i+1}
for i in range(n):
term_prev = -x[i-1] if i > 0 else 0
term_next = -x[i+1] if i < n - 1 else 0
y[i] = term_prev + 2 * x[i] + term_next
return y
def get_diag_inv_p1(i: int, n: int) -> float:
"""Returns 1/A_ii for Problem 1. Diagonal elements are all 2, so inverse is 1/2."""
return 1.0 / 2.0
def get_off_diag_sum_p1(x: np.ndarray, i: int, n: int) -> float:
"""Computes sum_{j!=i} A_ij * x_j. For Problem 1, A_ij = -1 for j=i-1, i+1, else 0."""
sum_val = 0.0
if i > 0:
sum_val += -x[i-1]
if i < n - 1:
sum_val += -x[i+1]
return sum_val
def solve_and_report(n: int):
"""
Solves the linear system for a given n and reports results.
"""
print(f"\n--- Solving for n = {n} ---")
h = 1.0 / (n + 1)
# Setup the right-hand side vector b
t = np.linspace(h, 1.0 - h, n)
b = (h**2) * t
# Calculate SOR parameter omega
omega = 2.0 / (1.0 + np.sin(np.pi * h))
# Store results
iteration_counts = []
all_residuals = {}
all_solutions = {}
# Define methods and run solvers
methods_to_run = {
'Jacobi': ('jacobi', {}),
'Gauss-Seidel': ('gauss_seidel', {}),
'SOR': ('sor', {'omega': omega}),
'Steepest Descent': (steepest_descent, {}),
'Conjugate Gradient': (conjugate_gradient, {})
}
print("\nStarting iterative solvers...")
for name, (method_func, params) in methods_to_run.items():
print(f"Running {name}...")
common_args = {'b': b, 'n': n}
if isinstance(method_func, str):
solver_args = { 'method': method_func, 'get_diag_inv': get_diag_inv_p1,
'get_off_diag_sum': get_off_diag_sum_p1, 'mat_vec_prod': mat_vec_prod_p1,
**common_args, **params }
solution, iters, res_hist = stationary_method(**solver_args)
else:
solver_args = {'mat_vec_prod': mat_vec_prod_p1, **common_args}
solution, iters, res_hist = method_func(**solver_args)
iteration_counts.append((name, iters))
all_residuals[name] = res_hist
all_solutions[name] = solution if iters < MAX_ITER else None
# (c): Report iteration counts
print("\n--- Iteration Counts ---")
for name, iters in iteration_counts:
status = "converged" if iters < MAX_ITER else "did NOT converge"
print(f"{name:<20}: {iters} iterations ({status}, last residual = {all_residuals[name][-1]:.2e})")
# (d): Plot residue history
plt.figure(figsize=(12, 8))
for name, res_hist in all_residuals.items():
res_log = np.log10(np.array(res_hist) + 1e-20)
plt.plot(res_log, label=name, linestyle='-')
plt.title(f'Convergence History for n = {n}')
plt.xlabel('Iteration Step (m)')
plt.ylabel('log10(||r^(m)||_2)')
plt.legend()
plt.grid(True)
# Set the y-axis limit to make the plot readable
current_ylim = plt.ylim()
plt.ylim(bottom=max(current_ylim[0], -13), top=current_ylim[1])
plt.savefig(f'problem1_convergence_n{n}.png')
# plt.show()
print(f"\nConvergence plot saved to 'problem1_convergence_n{n}.png'")
if all_solutions:
plt.figure(figsize=(12, 8))
# Plot exact solution on a fine grid
t_fine = np.linspace(0, 1, 500)
u_exact_fine = exact_solution(t_fine)
plt.plot(t_fine, u_exact_fine, 'k-', label='Exact Solution', linewidth=1, zorder=10) # Black, thick, on top
# Define some styles for the different numerical methods
styles = {
'Jacobi': {'color': 'red', 'linestyle': '--'},
'Gauss-Seidel': {'color': 'blue', 'linestyle': '-.'},
'SOR': {'color': 'green', 'linestyle': ':'},
'Steepest Descent':{'color': 'purple','linestyle': '--'},
'Conjugate Gradient':{'color': 'orange','linestyle': '-.'},
}
# Plot each numerical solution
for name, solution in all_solutions.items():
# Add boundary points for a complete plot
t_numerical_with_bounds = np.concatenate(([0], t, [1]))
u_numerical_with_bounds = np.concatenate(([0], solution, [0]))
style = styles.get(name, {'color': 'gray', 'linestyle': '-'})
plt.plot(t_numerical_with_bounds, u_numerical_with_bounds,
label=f'Numerical ({name})', **style, linewidth=2)
plt.title(f'Comparison of Exact and Numerical Solutions for n = {n}')
plt.xlabel('$t$')
plt.ylabel('$u(t)$')
plt.legend()
plt.grid(True)
plt.savefig(f'problem1_all_solutions_comparison_n{n}.png')
# plt.show()
print(f"All solutions comparison plot saved to 'problem1_all_solutions_comparison_n{n}.png'")
if __name__ == "__main__":
# Part (a)
plot_exact_solution()
# Part (b), (c), (d)
solve_and_report(n=20)
solve_and_report(n=40)

Binary file not shown (new image, 68 KiB).

Binary file not shown (new image, 68 KiB).

Binary file not shown (new image, 72 KiB).

Binary file not shown (new image, 72 KiB).

Binary file not shown (new image, 39 KiB).

View File

@@ -0,0 +1,39 @@
Exact solution plot saved to 'problem1_exact_solution.png'
--- Solving for n = 20 ---
Starting iterative solvers...
Running Jacobi...
Running Gauss-Seidel...
Running SOR...
Running Steepest Descent...
Running Conjugate Gradient...
--- Iteration Counts ---
Jacobi : 2031 iterations (converged, last residual = 5.78e-13)
Gauss-Seidel : 1018 iterations (converged, last residual = 5.72e-13)
SOR : 94 iterations (converged, last residual = 4.52e-13)
Steepest Descent : 2044 iterations (converged, last residual = 5.74e-13)
Conjugate Gradient : 20 iterations (converged, last residual = 1.39e-18)
Convergence plot saved to 'problem1_convergence_n20.png'
All solutions comparison plot saved to 'problem1_all_solutions_comparison_n20.png'
--- Solving for n = 40 ---
Starting iterative solvers...
Running Jacobi...
Running Gauss-Seidel...
Running SOR...
Running Steepest Descent...
Running Conjugate Gradient...
--- Iteration Counts ---
Jacobi : 7758 iterations (converged, last residual = 2.15e-13)
Gauss-Seidel : 3882 iterations (converged, last residual = 2.16e-13)
SOR : 183 iterations (converged, last residual = 2.04e-13)
Steepest Descent : 7842 iterations (converged, last residual = 2.16e-13)
Conjugate Gradient : 40 iterations (converged, last residual = 5.40e-19)
Convergence plot saved to 'problem1_convergence_n40.png'
All solutions comparison plot saved to 'problem1_all_solutions_comparison_n40.png'

147
project2/problem2.py Normal file
View File

@@ -0,0 +1,147 @@
import numpy as np
import matplotlib.pyplot as plt
from iterative_solvers import *
def mat_vec_prod_p2(x_flat: np.ndarray, n: int, h_sq: float) -> np.ndarray:
"""
Computes the matrix-vector product y = Ax for the 2D PDE problem.
"""
x_2d = x_flat.reshape((n, n))
x_padded = np.zeros((n + 2, n + 2))
x_padded[1:-1, 1:-1] = x_2d
y_2d = np.zeros((n, n))
# Apply the finite difference stencil: (4+h^2)u_ij - u_{i-1,j} - u_{i+1,j} - u_{i,j-1} - u_{i,j+1}
for i in range(n):
for j in range(n):
y_2d[i, j] = (4.0 + h_sq) * x_padded[i + 1, j + 1] \
- x_padded[i, j + 1] \
- x_padded[i + 2, j + 1] \
- x_padded[i + 1, j] \
- x_padded[i + 1, j + 2]
return y_2d.flatten()
def get_diag_inv_p2(i: int, n: int, h_sq: float) -> float:
"""Returns 1/A_ii for Problem 2. Diagonal is constant: 4 + h^2."""
return 1.0 / (4.0 + h_sq)
def get_off_diag_sum_p2(x_flat: np.ndarray, i_flat: int, n: int, **kwargs) -> float:
"""Computes the off-diagonal sum for a given row `i_flat` in Problem 2."""
row = i_flat // n
col = i_flat % n
sum_val = 0.0
if row > 0: sum_val += -x_flat[i_flat - n]
if row < n - 1: sum_val += -x_flat[i_flat + n]
if col > 0: sum_val += -x_flat[i_flat - 1]
if col < n - 1: sum_val += -x_flat[i_flat + 1]
return sum_val
def solve_and_report_p2(n: int):
"""Solves the 2D PDE linear system for a given n and reports results."""
print(f"\n--- Solving for n = {n} (System size: {n*n} x {n*n}) ---")
h = 1.0 / (n + 1)
h_sq = h**2
N = n * n
b = np.full(N, h_sq)
omega = 2.0 / (1.0 + np.sin(np.pi * h))
iteration_counts = []
all_residuals = {}
all_solutions = {}
methods_to_run = {
'Jacobi': ('jacobi', {}),
'Gauss-Seidel': ('gauss_seidel', {}),
'SOR': ('sor', {'omega': omega}),
'Steepest Descent': (steepest_descent, {}),
'Conjugate Gradient': (conjugate_gradient, {})
}
print("\nStarting iterative solvers...")
for name, (method_func, params) in methods_to_run.items():
print(f"Running {name}...")
solver_kwargs = {'n': n, 'h_sq': h_sq}
if isinstance(method_func, str):
solver_args = {'b': b, 'method': method_func, 'get_diag_inv': get_diag_inv_p2,
'get_off_diag_sum': get_off_diag_sum_p2, 'mat_vec_prod': mat_vec_prod_p2,
**solver_kwargs, **params}
solution, iters, res_hist = stationary_method(**solver_args)
else:
solver_args = {'b': b, 'mat_vec_prod': mat_vec_prod_p2, **solver_kwargs}
solution, iters, res_hist = method_func(**solver_args)
iteration_counts.append((name, iters))
all_residuals[name] = res_hist
all_solutions[name] = solution if iters < MAX_ITER else None
# Report iteration counts
print("\n--- Iteration Counts ---")
for name, iters in iteration_counts:
status = "converged" if iters < MAX_ITER else "did NOT converge"
print(f"{name:<20}: {iters} iterations ({status})")
# Plot residue history
plt.figure(figsize=(12, 8))
for name, res_hist in all_residuals.items():
res_log = np.log10(np.array(res_hist) + 1e-20)
plt.plot(res_log, label=name, linestyle='-')
plt.title(f'Convergence History for PDE Problem, n = {n}')
plt.xlabel('Iteration Step (m)')
plt.ylabel('log10(||r^(m)||_2)')
plt.legend()
plt.grid(True)
current_ylim = plt.ylim()
plt.ylim(bottom=max(current_ylim[0], -13), top=current_ylim[1])
plt.savefig(f'problem2_convergence_n{n}.png')
print(f"\nConvergence plot saved to 'problem2_convergence_n{n}.png'")
if all_solutions:
print("Generating 3D surface plots of the solutions...")
# Create the X, Y grid for the surface plot, including boundaries
plot_grid = np.linspace(0, 1, n + 2)
X, Y = np.meshgrid(plot_grid, plot_grid)
# Create a figure for the subplots
fig = plt.figure(figsize=(18, 10))
fig.suptitle(f'3D Surface Plots of Numerical Solutions for n = {n}', fontsize=16)
# Loop through the stored solutions and create a subplot for each
for i, (name, solution_flat) in enumerate(all_solutions.items()):
# Reshape the 1D solution vector into a 2D grid
solution_2d = solution_flat.reshape((n, n))
# Pad the solution with zero boundaries for plotting
u_padded = np.zeros((n + 2, n + 2))
u_padded[1:-1, 1:-1] = solution_2d
# Add a new 3D subplot
ax = fig.add_subplot(2, 3, i + 1, projection='3d')
# Plot the surface
ax.plot_surface(X, Y, u_padded, cmap='viridis', edgecolor='none')
# Set titles and labels for each subplot
ax.set_title(name)
ax.set_xlabel('x')
ax.set_ylabel('y')
ax.set_zlabel('u(x,y)')
ax.view_init(elev=30, azim=-60) # Set a nice viewing angle
plt.tight_layout(rect=[0, 0.03, 1, 0.95]) # Adjust layout to make room for suptitle
plt.savefig(f'problem2_3d_solutions_n{n}.png')
print(f"3D surface comparison plot saved to 'problem2_3d_solutions_n{n}.png'")
if __name__ == "__main__":
# Solve Problem 2 for n=16 and n=32
solve_and_report_p2(n=16)
solve_and_report_p2(n=32)

Binary file not shown (new image, 416 KiB).

Binary file not shown (new image, 525 KiB).

Binary file not shown (new image, 80 KiB).

Binary file not shown (new image, 70 KiB).

View File

@@ -0,0 +1,40 @@
--- Solving for n = 16 (System size: 256 x 256) ---
Starting iterative solvers...
Running Jacobi...
Running Gauss-Seidel...
Running SOR...
Running Steepest Descent...
Running Conjugate Gradient...
--- Iteration Counts ---
Jacobi : 1268 iterations (converged)
Gauss-Seidel : 635 iterations (converged)
SOR : 71 iterations (converged)
Steepest Descent : 1247 iterations (converged)
Conjugate Gradient : 31 iterations (converged)
Convergence plot saved to 'problem2_convergence_n16.png'
Generating 3D surface plots of the solutions...
3D surface comparison plot saved to 'problem2_3d_solutions_n16.png'
--- Solving for n = 32 (System size: 1024 x 1024) ---
Starting iterative solvers...
Running Jacobi...
Running Gauss-Seidel...
Running SOR...
Running Steepest Descent...
Running Conjugate Gradient...
--- Iteration Counts ---
Jacobi : 4792 iterations (converged)
Gauss-Seidel : 2397 iterations (converged)
SOR : 138 iterations (converged)
Steepest Descent : 4807 iterations (converged)
Conjugate Gradient : 66 iterations (converged)
Convergence plot saved to 'problem2_convergence_n32.png'
Generating 3D surface plots of the solutions...
3D surface comparison plot saved to 'problem2_3d_solutions_n32.png'