Fitting Models to Data Graphically¶

Author: S.K. Cheng¶

2024-08-04¶

Introduction¶

In mathematical modeling we repeatedly face the problem of analyzing data. One example: suppose we have analyzed the distance required to bring a car to a safe stop once the brakes are applied, and our assumptions led to a submodel of the form $$ d_b = Cv^2 $$ where $d_b$ is the distance required to stop the car, $v$ is the velocity of the car at the time the brakes are applied, and $C$ is a constant of proportionality. At this point we can collect and analyze sufficient data to determine the value of $C$ and to judge whether the model is reasonable.

In [ ]:
# Suppose the model of the form d_b = C * v^2
# where d_b is the braking distance, v is the velocity, and C is a constant.
import numpy as np
import matplotlib.pyplot as plt

# We make up some data for d_b and v
v = np.array([10, 20, 30, 40, 50, 60, 70, 80, 90, 100])
d_b = np.array([2, 8, 18, 32, 50, 72, 98, 128, 162, 200])

# We can plot the data
plt.plot(v, d_b, 'o')
plt.title('Braking distance vs velocity (Raw Data)')
plt.xlabel('Velocity (m/s)')
plt.ylabel('Braking distance (m)')
plt.show()

# We can see that the data is quadratic, so we can fit a quadratic model to it
# We can use the polyfit function to fit a polynomial of degree 2 to the data
coefficients = np.polyfit(v, d_b, 2)
print('Coefficients:', coefficients)

# We can use the polyval function to evaluate the polynomial at the data points
d_b_fit = np.polyval(coefficients, v)

# We can plot the data and the fit
plt.plot(v, d_b, 'o', label='Data')
plt.plot(v, d_b_fit, label='Fit')
plt.title('Braking distance vs velocity (Quadratic Fit)')
plt.xlabel('Velocity (m/s)')
plt.ylabel('Braking distance (m)')
plt.legend()
plt.show()
[Plot: Braking distance vs velocity (Raw Data)]
Coefficients: [ 2.00000000e-02  4.24758863e-15 -1.71187836e-13]
[Plot: Braking distance vs velocity (Quadratic Fit)]

As we can see in the output of the code above, the data is not linear, so a linear model is not appropriate; a quadratic model fits the data well. One may wonder why the fitted model appears to contain no linear or constant term. In fact, polyfit does return coefficients for the linear and constant terms, but their values are approximately zero (on the order of $10^{-15}$ for the linear term and $10^{-13}$ for the constant term).
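Since the submodel assumes $d_b$ is proportional to $v^2$, we can also estimate the single constant $C$ directly instead of fitting a full quadratic. The cell below is a minimal sketch (an addition, not part of the original analysis; the variable names are illustrative) that fits only $C$ by least squares; for this data the estimate should again be close to $0.02$.

In [ ]:
# A sketch (not part of the original analysis): fit only the constant C in d_b = C * v^2.
import numpy as np

# Same made-up data as above
v = np.array([10, 20, 30, 40, 50, 60, 70, 80, 90, 100])
d_b = np.array([2, 8, 18, 32, 50, 72, 98, 128, 162, 200])

# With a single unknown, least squares gives C = sum(v^2 * d_b) / sum(v^4)
C = np.sum(v**2 * d_b) / np.sum(v**4)
print('Estimated C:', C)

# The same estimate via a one-column linear least-squares solve
C_lstsq, *_ = np.linalg.lstsq(v[:, None]**2, d_b, rcond=None)
print('lstsq estimate:', C_lstsq[0])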

Though we have already assumed the model to be quadratic, we still need to verify the assumption by plotting the data and the model. This is the main purpose of this notebook.

Analytic Methods of Model Fitting¶

In this section we investigate several criteria for fitting curves to a collection of data points. Each criterion suggests a method for selecting the best curve from a given family so that according to the criterion, the curve most accurately represents the data. The criteria are:

  • Chebyshev Approximation Criterion
  • Minimizing the Sum of the Absolute Deviations
  • Least-Squares Criterion

Chebyshev Approximation Criterion¶

In the preceding section we graphically fit lines to a given collection of data points. One of the best-fit criteria used was to minimize the largest distance from the line to any corresponding data point. Let us analyze this geometric construction.

Given a collection of $m$ data points $(x_1, y_1), (x_2, y_2), \ldots, (x_m, y_m)$, fit the collection with the line $y=ax+b$, determined by the parameters $a$ and $b$, that minimizes the distance between any data point $(x_i,y_i)$ and the corresponding point on the line $(x_i, ax_i+b)$. This distance is given by $$ d_i = |y_i - ax_i - b| $$ Now let us generalize this criterion. Given some function type $y=f(x)$ and a collection of $m$ data points $(x_i,y_i)$, minimize the largest absolute deviation $|y_i - f(x_i)|$ over the entire collection. That is, determine the parameters of the function type $y=f(x)$ that minimize the number $$ \operatorname{Maximum} |y_i - f(x_i)| \quad i=1,2,\dots,m $$ This important criterion is often called the Chebyshev Approximation Criterion. The difficulty with the Chebyshev criterion is that it is often complicated to apply in practice, at least using only elementary calculus. However, it is a useful criterion for understanding the nature of the best-fit curve.

Problem¶

  1. For the following data, formulate the mathematical model that minimizes the largest deviation between the data and the model $y=c_1x^2+c_2x+c_3$. If a computer is available, solve for the estimates of $c_1, c_2, c_3$.
$x$ $0.1$ $0.2$ $0.3$ $0.4$ $0.5$
$y$ $0.06$ $0.12$ $0.36$ $0.65$ $0.95$

Sol: The Chebyshev Approximation Criterion asks for the parameters $c_1, c_2, c_3$ that minimize the maximum deviation between the data and the model, where the deviation at each point is $$ d_i = |y_i - c_1x_i^2 - c_2x_i - c_3| $$ Introducing a new variable $r$ for the largest deviation, the problem is to minimize $r$ subject to $$ r - |y_i - c_1x_i^2 - c_2x_i - c_3| \ge 0 \quad i=1,2,\dots,m $$ Each absolute-value constraint can be split into the two linear constraints $r - (y_i - c_1x_i^2 - c_2x_i - c_3) \ge 0$ and $r + (y_i - c_1x_i^2 - c_2x_i - c_3) \ge 0$, so the formulation is a linear program in the variables $c_1, c_2, c_3, r$. The model that minimizes the maximum deviation is the best-fit model under this criterion.

In [ ]:
# Based on the problem, we have the following
x = np.array([0.1, 0.2, 0.3, 0.4, 0.5])
y = np.array([0.06,0.12,0.36,0.65,0.95])

# We can plot the data
plt.plot(x, y, 'o')
plt.title('y vs x (Raw Data)')
plt.xlim(0, 0.6)
plt.ylim(0, 1)
plt.xlabel('x')
plt.ylabel('y')
plt.show()

# We can see that the data is quadratic, so we can fit a quadratic model to it
# We can use the polyfit function to fit a polynomial of degree 2 to the data
coefficients = np.polyfit(x, y, 2)
print('Coefficients:', coefficients)

# We can use the polyval function to evaluate the polynomial at the data points
y_fit = np.polyval(coefficients, x)

# We can plot the data and the fit
plt.plot(x, y, 'o', label='Data')
plt.plot(x, y_fit, label='Fit')
plt.title('y vs x (Quadratic Fit)')
plt.xlim(0, 0.6)
plt.ylim(0, 1)
plt.xlabel('x')
plt.ylabel('y')
plt.legend()
plt.show()

# Calculate the maximum absolute deviation
max_abs_deviation = np.max(np.abs(y - y_fit))
print('Maximum absolute deviation:', max_abs_deviation)
[Plot: y vs x (Raw Data)]
Coefficients: [3.78571429e+00 3.85714286e-02 6.03566116e-16]
[Plot: y vs x (Quadratic Fit)]
Maximum absolute deviation: 0.039142857142857534
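Note that np.polyfit minimizes the sum of squared deviations rather than the largest deviation, so the fit above is not, in general, the Chebyshev best fit; its maximum absolute deviation is only an upper bound on the Chebyshev optimum. The cell below is a minimal sketch (an addition, assuming scipy is available) that solves the linear program formulated in the solution above with scipy.optimize.linprog.

In [ ]:
# A sketch (an addition; assumes scipy is available) solving the Chebyshev problem as a
# linear program: minimize r subject to |y_i - (c1*x_i^2 + c2*x_i + c3)| <= r for all i.
import numpy as np
from scipy.optimize import linprog

x = np.array([0.1, 0.2, 0.3, 0.4, 0.5])
y = np.array([0.06, 0.12, 0.36, 0.65, 0.95])

# Decision variables: [c1, c2, c3, r]; the objective is to minimize r
objective = np.array([0.0, 0.0, 0.0, 1.0])

X = np.column_stack([x**2, x, np.ones_like(x)])
# Split each absolute-value constraint into two linear inequalities:
#   y_i - f(x_i) <= r   and   f(x_i) - y_i <= r
A_ub = np.vstack([np.hstack([-X, -np.ones((len(x), 1))]),
                  np.hstack([ X, -np.ones((len(x), 1))])])
b_ub = np.concatenate([-y, y])

bounds = [(None, None)] * 3 + [(0, None)]  # c1, c2, c3 free; r >= 0
result = linprog(objective, A_ub=A_ub, b_ub=b_ub, bounds=bounds)
c1, c2, c3, r = result.x
print('Chebyshev estimates:', c1, c2, c3)
print('Largest absolute deviation:', r)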

Least-Squares Criterion¶

Currently, the most frequently used curve-fitting criterion is the Least-Squares Criterion. Using the same notation as before, the problem is to determine the parameters of the function type $y=f(x)$ that minimize the sum $$ \sum_{i=1}^m (y_i - f(x_i))^2 $$ Part of the popularity of this criterion stems from the ease with which the resulting optimization problem can be solved using only the calculus of several variables. However, relatively recent advances in mathematical programming techniques (such as the Simplex Method for solving many applications of the Chebyshev criterion) and advances in numerical methods for approximating solutions to the Chebyshev criterion promise to dissipate this advantage. The justification for the use of the least-squares method increases when we consider probabilistic arguments that assume the errors are distributed normally.
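To make the calculus remark concrete, the cell below is a small sketch (an addition, not part of the original notebook) of the resulting normal equations for the quadratic model $y=c_1x^2+c_2x+c_3$: setting the partial derivatives of $\sum_i (y_i - c_1x_i^2 - c_2x_i - c_3)^2$ with respect to $c_1, c_2, c_3$ to zero gives the linear system $(X^TX)\,c = X^Ty$, whose solution should agree with np.polyfit.

In [ ]:
# A sketch (an addition): least squares via the normal equations (X^T X) c = X^T y,
# using the data from the problem above.
import numpy as np

x = np.array([0.1, 0.2, 0.3, 0.4, 0.5])
y = np.array([0.06, 0.12, 0.36, 0.65, 0.95])

X = np.column_stack([x**2, x, np.ones_like(x)])  # design matrix for c1*x^2 + c2*x + c3
c = np.linalg.solve(X.T @ X, X.T @ y)            # normal equations
print('Normal-equation coefficients:', c)
print('np.polyfit coefficients:     ', np.polyfit(x, y, 2))  # should agree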

In [ ]:
# For the same problem and quadratic fit as above,
# compute the sum of squared deviations of the fit
min_sum = np.sum((y - y_fit)**2)
print('Sum of squared deviations:', min_sum)
Sum of squared deviations: 0.003005714285714285

Applying the Least-Squares Criterion¶

Project¶

  1. Lumber Cutters: Lumber cutters wish to use readily available measurements to estimate the number of board feet of lumber in a tree. Assume they measure the diameter of the tree in inches at waist height. Develop a model that predicts board feet as a function of diameter in inches.

Use the following data for your test:

$x$ $17$ $19$ $20$ $23$ $25$ $28$ $32$ $38$ $39$ $41$
$y$ $19$ $25$ $32$ $57$ $71$ $113$ $123$ $252$ $259$ $294$

The variable $x$ is the diameter of a ponderosa pine in inches, and $y$ is the number of board feet divided by $10$.

  • Consider two separate assumptions, allowing each to lead to a model. Completely analyze each model (a least-squares sketch of both submodels follows this list).
    • Assume that all trees are right-circular cylinders and are approximately the same height.
    • Assume that all trees are right-circular cylinders and that the height of the tree is proportional to the diameter.
  • Which model appears to be better? Why? Justify your conclusions.
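Before fitting general polynomials, note what the two assumptions predict: for a right-circular cylinder the volume is $\pi (d/2)^2 h$, so a constant height gives board feet proportional to $d^2$, while a height proportional to the diameter gives board feet proportional to $d^3$. The cell below is a minimal sketch (an addition, not part of the original analysis) fitting each one-parameter submodel, $y=k_1x^2$ and $y=k_2x^3$, by least squares.

In [ ]:
# A sketch (an addition): fit the two one-parameter submodels suggested by the assumptions,
#   constant height                 -> y = k1 * x^2
#   height proportional to diameter -> y = k2 * x^3
import numpy as np

x = np.array([17, 19, 20, 23, 25, 28, 32, 38, 39, 41], dtype=float)
y = np.array([19, 25, 32, 57, 71, 113, 123, 252, 259, 294], dtype=float)

# One-parameter least squares: k = sum(x^n * y) / sum(x^(2n))
k1 = np.sum(x**2 * y) / np.sum(x**4)
k2 = np.sum(x**3 * y) / np.sum(x**6)

print('y = k1*x^2:  k1 =', k1, ' sum of squared deviations =', np.sum((y - k1 * x**2)**2))
print('y = k2*x^3:  k2 =', k2, ' sum of squared deviations =', np.sum((y - k2 * x**3)**2))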
In [ ]:
# Assume that all trees are right-circular cylinders and are approximately the same height.
# The objective is to use the diameter of the tree to predict the number of board feet of lumber that can be obtained from the tree.
# The data is as follows:
x = np.array([17,19,20,23,25,28,32,38,39,41])
y = np.array([19,25,32,57,71,113,123,252,259,294])

# We can plot the data
plt.plot(x, y, 'o')
plt.title('The Number of Board Feet of Lumber vs Diameter of the Tree (Raw Data)')
plt.xlabel('Diameter of the Tree (in)')
plt.ylabel('The Number of Board Feet of Lumber')
plt.show()

# It is not easy to see the relationship between x and y, so we can take the logarithm of y and plot it against x again
y_log = np.log(y)
plt.plot(x, y_log, 'o')
plt.title('The Number of Board Feet of Lumber vs Diameter of the Tree (Logarithm of y)')
plt.xlabel('Diameter of the Tree (in)')
plt.ylabel('Log(The Number of Board Feet of Lumber)')
plt.show()

# We fit a quadratic model to the data
coefficients = np.polyfit(x, y_log, 2)
print('Coefficients:', coefficients)

# We can use the polyval function to evaluate the polynomial at the data points
y_log_fit = np.polyval(coefficients, x)

# Apply the Least-Squares Criterion in log space
min_sum = np.sum((y_log - y_log_fit)**2)
print('Sum of squared deviations (log scale):', min_sum)

# We can plot the data and the fit
plt.plot(x, y_log, 'o', label='Data')
plt.plot(x, y_log_fit, label='Fit')
plt.title('The Number of Board Feet of Lumber vs Diameter of the Tree (Quadratic Fit)')
plt.xlabel('Diameter of the Tree (in)')
plt.ylabel('Log(The Number of Board Feet of Lumber)')
plt.legend()
plt.show()

# We can convert the logarithm of y back to y
y_fit = np.exp(y_log_fit)

# Apply the Least-Squares Criterion on the original scale
min_sum = np.sum((y - y_fit)**2)
print('Sum of squared deviations (original scale):', min_sum)

# We can plot the data and the fit
plt.plot(x, y, 'o', label='Data')
plt.plot(x, y_fit, label='Fit')
plt.title('The Number of Board Feet of Lumber vs Diameter of the Tree (Quadratic Fit)')
plt.xlabel('Diameter of the Tree (in)')
plt.ylabel('The Number of Board Feet of Lumber')
plt.legend()
plt.show()
[Plot: The Number of Board Feet of Lumber vs Diameter of the Tree (Raw Data)]
[Plot: The Number of Board Feet of Lumber vs Diameter of the Tree (Logarithm of y)]
Coefficients: [-0.00295156  0.28393066 -1.02696457]
Sum of squared deviations (log scale): 0.08456348023205189
[Plot: Quadratic fit to Log(The Number of Board Feet of Lumber)]
Sum of squared deviations (original scale): 1288.4760286362534
[Plot: Quadratic fit transformed back to the original scale]

Another question is whether a cubic model would fit better. The cubic model is given by $$ y = c_1x^3 + c_2x^2 + c_3x + c_4 $$

In [ ]:
# We use the same data as before but with cubic model
# We fit a cubic model to the data
coefficients_cubic = np.polyfit(x, y_log, 3)
print('Coefficients:', coefficients_cubic)

# We can use the polyval function to evaluate the polynomial at the data points
y_log_fit_cubic = np.polyval(coefficients_cubic, x)

# Apply the Least-Squares Criterion in log space
min_sum = np.sum((y_log - y_log_fit_cubic)**2)
print('Sum of squared deviations (log scale):', min_sum)

# Transform the logarithm of y back to y
y_fit_cubic = np.exp(y_log_fit_cubic)

# Apply the Least-Squares Criterion on the original scale
min_sum = np.sum((y - y_fit_cubic)**2)
print('Sum of squared deviations (original scale):', min_sum)

# We can plot the data and the fit
plt.plot(x, y, 'o', label='Data')
plt.plot(x, y_fit, label='Quadratic Fit')
plt.plot(x, y_fit_cubic, label='Cubic Fit')
plt.title('The Number of Board Feet of Lumber vs Diameter of the Tree (Quadratic and Cubic Fit)')
plt.xlabel('Diameter of the Tree (in)')
plt.ylabel('The Number of Board Feet of Lumber')
plt.legend()
plt.show()
Coefficients: [ 1.56744915e-04 -1.64372710e-02  6.53678409e-01 -4.25135994e+00]
Sum of squared deviations (log scale): 0.06331130861072956
Sum of squared deviations (original scale): 1115.8476339863835
[Plot: Data with quadratic and cubic fits]

Judged by the Least-Squares Criterion alone, the cubic model fits better than the quadratic model, since its sum of squared deviations is smaller. However, one should also consider the complexity of the model: the cubic model has one more parameter than the quadratic model, and the improvement in fit is modest, so in this case the simpler quadratic model is preferable. To sum up, we may consider the following factors when choosing the best model:

  • The complexity of the model
  • The accuracy of the model

Conclusion¶

In this notebook, we have discussed the Chebyshev Approximation Criterion and the Least-Squares Criterion. We have also applied the Least-Squares Criterion to compare the quadratic and cubic models, since these are among the most common models used in fitting data, and we have discussed the factors to consider when choosing the best model.