# Import libraries
import os
import pandas as pd #pd is a convenient shortform for pandas
import numpy as np #np is a convenient shortform for numpy
import seaborn as sns #sns is a convenient shortform for seaborn
import matplotlib.pyplot as plt #plt is a convenient shortform for matplotlib

# Load the Nvidia historical price data into a pandas DataFrame
NVDA_df = pd.read_csv("/home/jovyan/work/rico-kanthatham/datasets/Nvidia_stock_data.csv")  # path to CSV file

# Preview the first 10 rows (head() returns 5 rows when called with no argument).
# The result is printed explicitly: a bare expression that is not the last
# statement of a cell is evaluated and then silently discarded.
print(NVDA_df.head(10))

# Parse the Date column into pandas datetime values
NVDA_df['Date'] = pd.to_datetime(NVDA_df['Date'])

# Scatter plot of closing price (y axis) against date (x axis)
plt.figure(figsize=(12, 6))  # figure width and height
plt.scatter(NVDA_df['Date'], NVDA_df['Close'], color='red', s=0.5)  # one small red marker per row

plt.xlabel("Date")
plt.ylabel("Closing Price")
plt.title("Historic Closing Price")
plt.xticks(rotation=45)  # rotate x-axis tick labels 45 degrees

# plt.tight_layout()
plt.show()

# Import libraries
import os
import pandas as pd #pd is a convenient shortform for pandas
import numpy as np #np is a convenient shortform for numpy
# import seaborn as sns #sns is a convenient shortform for seaborn
import matplotlib.pyplot as plt #plt is a convenient shortform for matplotlib

# Load the Nvidia historical price data into a pandas DataFrame
NVDA_df = pd.read_csv("/home/jovyan/work/rico-kanthatham/datasets/Nvidia_stock_data.csv")  # path to CSV file

# Preview the first 10 rows (head() returns 5 rows when called with no argument).
# The result is printed explicitly: a bare expression that is not the last
# statement of a cell is evaluated and then silently discarded.
print(NVDA_df.head(10))

# Parse the Date column into pandas datetime values
NVDA_df['Date'] = pd.to_datetime(NVDA_df['Date'])

# Create and assign the plotting variables
x = NVDA_df['Date']
y = NVDA_df['Close']

# Scatter plot of closing price (y axis) against date (x axis)
plt.figure(figsize=(12, 6))  # figure width and height
plt.scatter(x, y, color='red', s=0.5)  # one small red marker per row

plt.xlabel("Date")
plt.ylabel("Closing Price")
plt.title("Historic Closing Price")
plt.xticks(rotation=45)  # rotate x-axis tick labels 45 degrees

# plt.tight_layout()
plt.show()

# Polynomial Fit Functions
# np.polyfit adds 0.0 to its x input, which raises UFuncTypeError for
# datetime64 values, so the fit runs against the 0-based row position instead.
# The fitted coefficients are therefore expressed per row, not per calendar day.
x_num = np.arange(len(x))
cL = np.polyfit(x_num, y, 1)  # coefficients of the degree-1 (linear) least-squares fit
cQ = np.polyfit(x_num, y, 2)  # coefficients of the degree-2 (quadratic) least-squares fit
L = np.poly1d(cL)  # callable polynomial built from the linear coefficients
print(L)

---------------------------------------------------------------------------
UFuncTypeError                            Traceback (most recent call last)
Cell In[3], line 34
     31 plt.show()
     33 # Polynomial Fit Functions
---> 34 cL = np.polyfit(x,y,1) #generate coefficients for a linear Fit Function
     35 # cQ = np.polyfit(x,y,2) #generate coefficients for a Quadratic Fit Function
     36 # L = np.poly1d(cL)
     37 # print(L)

File /opt/conda/lib/python3.13/site-packages/numpy/lib/_polynomial_impl.py:636, in polyfit(x, y, deg, rcond, full, w, cov)
    460 """
    461 Least squares polynomial fit.
    462 
   (...)    633 
    634 """
    635 order = int(deg) + 1
--> 636 x = NX.asarray(x) + 0.0
    637 y = NX.asarray(y) + 0.0
    639 # check arguments.

UFuncTypeError: ufunc 'add' cannot use operands with types dtype('<M8[ns]') and dtype('float64')

# Import libraries
import os
import pandas as pd #pd is a convenient shortform for pandas
import numpy as np #np is a convenient shortform for numpy
# import seaborn as sns #sns is a convenient shortform for seaborn
import matplotlib.pyplot as plt #plt is a convenient shortform for matplotlib

# Load the Nvidia historical price data into a pandas DataFrame
NVDA_df = pd.read_csv("/home/jovyan/work/rico-kanthatham/datasets/Nvidia_stock_data.csv")  # path to CSV file

# Preview the first 10 rows (head() returns 5 rows when called with no argument).
# The result is printed explicitly: a bare expression that is not the last
# statement of a cell is evaluated and then silently discarded.
print(NVDA_df.head(10))

# Parse the Date column into pandas datetime values
NVDA_df['Date'] = pd.to_datetime(NVDA_df['Date'])

# Create and assign the fitting variables.
# x is the 0-based row position: a numeric stand-in for the date, because
# np.polyfit cannot operate on datetime64 values.
x = np.arange(len(NVDA_df['Date']))
y = NVDA_df['Close']

# Scatter plot of closing price (y axis) against date (x axis).
# The Date column is plotted rather than x so the axis really shows dates,
# matching the "Date" axis label below.
plt.figure(figsize=(12, 6))  # figure width and height
plt.scatter(NVDA_df['Date'], y, color='red', s=0.5)  # one small red marker per row

plt.xlabel("Date")
plt.ylabel("Closing Price")
plt.title("Historic Closing Price")
plt.xticks(rotation=45)  # rotate x-axis tick labels 45 degrees

# plt.tight_layout()
plt.show()

# Polynomial Fit Functions (coefficients are expressed per row position)
cL = np.polyfit(x, y, 1)  # coefficients of the degree-1 (linear) least-squares fit
cQ = np.polyfit(x, y, 2)  # coefficients of the degree-2 (quadratic) least-squares fit
L = np.poly1d(cL)  # callable polynomial built from the linear coefficients
print('Linear Coefficient: ', L)

Linear Coefficient:   
0.009793 x - 20.14

# Import libraries
import os
import pandas as pd #pd is a convenient shortform for pandas
import numpy as np #np is a convenient shortform for numpy
# import seaborn as sns #sns is a convenient shortform for seaborn
import matplotlib.pyplot as plt #plt is a convenient shortform for matplotlib

# Load the Nvidia historical price data into a pandas DataFrame
NVDA_df = pd.read_csv("/home/jovyan/work/rico-kanthatham/datasets/Nvidia_stock_data.csv")  # path to CSV file

# Preview the first 10 rows (head() returns 5 rows when called with no argument).
# The result is printed explicitly: a bare expression that is not the last
# statement of a cell is evaluated and then silently discarded.
print(NVDA_df.head(10))

# Parse the Date column into pandas datetime values
NVDA_df['Date'] = pd.to_datetime(NVDA_df['Date'])

# Create and assign the fitting variables.
# x is the 0-based row position: a numeric stand-in for the date, because
# np.polyfit cannot operate on datetime64 values.
x = np.arange(len(NVDA_df['Date']))
y = NVDA_df['Close']

# Scatter plot of closing price (y axis) against date (x axis).
# The Date column is plotted rather than x so the axis really shows dates,
# matching the "Date" axis label below.
plt.figure(figsize=(12, 6))  # figure width and height
plt.scatter(NVDA_df['Date'], y, color='red', s=0.5)  # one small red marker per row

plt.xlabel("Date")
plt.ylabel("Closing Price")
plt.title("Historic Closing Price")
plt.xticks(rotation=45)  # rotate x-axis tick labels 45 degrees

# plt.tight_layout()
plt.show()  # show the closing price as a scatter plot

# Polynomial Fit Functions (coefficients are expressed per row position)
cL = np.polyfit(x, y, 1)  # coefficients of the degree-1 (linear) least-squares fit
cQ = np.polyfit(x, y, 2)  # coefficients of the degree-2 (quadratic) least-squares fit
L = np.poly1d(cL)  # callable linear model
Q = np.poly1d(cQ)  # callable quadratic model

# str(poly1d) spans two lines (an exponent row above the terms). Start it on a
# fresh line so the label does not shift the exponent row out of alignment.
print(f"Linear Coefficient:\n{L}")
print(f"Quadratic Coefficient:\n{Q}")

Linear Coefficient:  
0.009793 x - 20.14
Quadratic Coefficient:            2
5.523e-06 x - 0.02749 x + 21.81

# Plot the Linear Fit Line

# Evaluate the linear model at every integer position from the smallest to the
# largest x. np.arange excludes its stop value, so + 1 is needed for the line
# to reach the final data point.
x_lin = np.arange(np.min(x), np.max(x) + 1)
y_linModel = L(x_lin)
plt.scatter(x, y, color='red', s=0.5)  # original data as small red markers
plt.plot(x_lin, y_linModel)  # fitted straight line on top

[<matplotlib.lines.Line2D at 0xfe7180d65d10>]

# Plot the Quadratic Fit Line

# Evaluate the quadratic model at every integer position from the smallest to
# the largest x. np.arange excludes its stop value, so + 1 is needed for the
# curve to reach the final data point.
x_quad = np.arange(np.min(x), np.max(x) + 1)
y_quadModel = Q(x_quad)
plt.scatter(x, y, color='red', s=0.5)  # original data as small red markers
plt.plot(x_quad, y_quadModel)  # fitted parabola on top

[<matplotlib.lines.Line2D at 0xfe7180e4b4d0>]

# Plot Linear and Quadratic Fit Lines over Scatter Plot

# Both models are evaluated at every integer position from the smallest to the
# largest x. np.arange excludes its stop value, so + 1 is needed for the curves
# to reach the final data point.
x_quad = np.arange(np.min(x), np.max(x) + 1)
y_quadModel = Q(x_quad)
plt.plot(x_quad, y_quadModel)  # quadratic fit

x_lin = np.arange(np.min(x), np.max(x) + 1)
y_linModel = L(x_lin)
plt.plot(x_lin, y_linModel)  # linear fit

plt.scatter(x, y, color='red', s=0.5)  # original data as small red markers

<matplotlib.collections.PathCollection at 0xfe7180ba9f90>

Data Science/Session 3 > Fitting Function

Class Notes

Math > Fitting Functions

Variable Types

Functions

Straight Line > $y = ax$

Affine > $y = ax+b$

Errors

Fitting

Radial Basis Function Fit (RBF)

Non-Linear Least Squares

Assignment:

Assignment Research

Assignment Work

Prepping for Fitting Function > Visualize Data as Scatter Plot

Fitting a Function to Data

Observations