# Example
'''
This example uses np.random.multivariate_normal to generate 1000 random
samples from a multivariate normal distribution with the specified mean
vector and covariance matrix. Finally, we calculate the sample mean and
sample covariance matrix from the generated samples.
'''
import numpy as np

# Population parameters of the 3-variable normal distribution
mean = np.array([1, 2, 3])  # Mean values for each variable
cov_matrix = np.array([[1, 0.5, 0.2],
                       [0.5, 2, 0.7],
                       [0.2, 0.7, 3]])  # Covariance matrix (symmetric)

# Seed the global NumPy RNG so every run draws the same samples, following
# the np.random.seed(0) convention of the regression example in this file.
# NOTE: output recorded from an earlier, unseeded run will not match exactly.
np.random.seed(0)

# Generate random samples: one row per draw, one column per variable
num_samples = 1000
samples = np.random.multivariate_normal(mean, cov_matrix, num_samples)

# Bare expression that echoes the generated sample array (presumably a
# notebook cell; the array repr recorded below is its displayed value)
samples

array([[2.58420809, 1.22145592, 2.36222512],
       [0.04496765, 1.50661912, 2.90042915],
       [1.53004047, 2.84612934, 1.30889197],
       ...,
       [3.14177554, 0.50289507, 1.32654185],
       [1.18476508, 3.73173457, 4.2904478 ],
       [2.21205365, 1.6127218 , 4.807605  ]])

# Bare expression that echoes the population mean vector defined above
# (presumably a notebook cell; its recorded repr follows)
mean

array([1, 2, 3])

# Report the empirical statistics of the generated samples
sample_mean = samples.mean(axis=0)  # column-wise average, one entry per variable
sample_cov = np.cov(samples.T)  # transposed so that each row is one variable
print("Sample Mean:", sample_mean)
print("\nSample Covariance Matrix:")
print(sample_cov)

Sample Mean: [1.01489746 1.9518071  2.9336716 ]

Sample Covariance Matrix:
[[0.98420241 0.47107553 0.24961479]
 [0.47107553 1.88734245 0.72539194]
 [0.24961479 0.72539194 3.04130146]]

# Monte Carlo simulation example
import numpy as np

# Define mean vector and covariance matrix of the bivariate normal (X, Y)
mean = np.array([1, 2])  # Mean values for X and Y
cov_matrix = np.array([[1, 0.5],
                       [0.5, 2]])  # Covariance matrix

# Set number of simulations and samples per simulation
num_simulations = 1000
num_samples = 100

# Seed the global NumPy RNG once, before the loop, so the whole experiment is
# reproducible (same np.random.seed(0) convention as the regression example
# in this file). Seeding inside the loop would make every simulation identical.
np.random.seed(0)

# Run Monte Carlo simulations
results = []
for _ in range(num_simulations):
    samples = np.random.multivariate_normal(mean, cov_matrix, num_samples)
    # Statistic of interest: sample mean of X plus sample mean of Y
    simulation_result = np.mean(samples[:, 0]) + np.mean(samples[:, 1])
    results.append(simulation_result)

# Calculate statistics of the simulation results.
# Analytically the statistic has expectation 1 + 2 = 3 and standard deviation
# sqrt((Var X + Var Y + 2 Cov(X, Y)) / num_samples) = sqrt(4 / 100) = 0.2,
# so the two values below should land close to 3 and 0.2.
mean_simulation = np.mean(results)
std_simulation = np.std(results)  # NumPy default ddof=0 (population std)

# Print simulation statistics
print("Simulation Mean:", mean_simulation)
print("Simulation Standard Deviation:", std_simulation)

Simulation Mean: 2.9920839993485195
Simulation Standard Deviation: 0.19408450356219822

import numpy as np
import matplotlib.pyplot as plt

# Original Dataset
x = np.array([1, 2, 3, 4, 5])  # Independent variable
y = np.array([2, 4, 6, 8, 10])  # Dependent variable (exactly 2 * x)

# Calculate mean and covariance matrix of the original dataset.
# np.cov(x, y) yields the 2x2 sample covariance matrix of the two series.
# Because y is an exact multiple of x, that matrix is singular, so every
# simulated point lies on the line y = 2x (up to floating-point error).
mean = np.array([np.mean(x), np.mean(y)])
cov_matrix = np.cov(x, y)

# Seed the global NumPy RNG so the simulated data (and the plot built from
# it) is reproducible, following the np.random.seed(0) convention of the
# regression example in this file.
np.random.seed(0)

# Generate simulated data based on the original dataset properties.
# The draw has one row per sample; transposing gives one row per variable.
num_samples = 1000
simulated_data = np.random.multivariate_normal(mean, cov_matrix, num_samples).T

# Extract simulated x and y values (row 0 and row 1 respectively)
simulated_x, simulated_y = simulated_data

# Overlay the original points and the simulated cloud on one scatter plot.
# Each layer is (x values, y values, keyword styling passed to plt.scatter);
# the original data uses large red circles, the simulation small blue squares.
scatter_layers = [
    (x, y,
     dict(label='Original Data', color='red', marker='o', s=50, alpha=0.8)),
    (simulated_x, simulated_y,
     dict(label='Simulated Data', color='blue', marker='s', s=2, alpha=0.5)),
]
for xs, ys, style in scatter_layers:
    plt.scatter(xs, ys, **style)

# Axis labels, title and legend, then render the figure
plt.xlabel('X')
plt.ylabel('Y')
plt.title('Original and Simulated Data')
plt.legend()
plt.show()

import numpy as np
import matplotlib.pyplot as plt
from sklearn.linear_model import LinearRegression

# Parameters of the bivariate normal distribution the data is drawn from
np.random.seed(0)  # fixed seed so the generated data is reproducible
mean = [0, 0]
cov_matrix = [[1, 0.8], [0.8, 2]]
num_samples = 100

# Draw the samples (one row per draw) and transpose so that each row of
# simulated_data holds one variable
simulated_data = np.transpose(
    np.random.multivariate_normal(mean, cov_matrix, size=num_samples)
)

# Split the two rows into the simulated variables
x, y = simulated_data

# Fit a linear regression of y on x. scikit-learn expects a 2-D feature
# matrix, so x gets an explicit column axis (shape (n, 1)).
regression_model = LinearRegression().fit(x[:, np.newaxis], y)

# Evaluate the fitted line on 100 evenly spaced points spanning the observed
# range of x, for drawing the regression line
x_range = np.linspace(x.min(), x.max(), 100)
y_pred = regression_model.predict(x_range[:, np.newaxis])

# Draw the simulated points with the fitted regression line on top
plt.scatter(x, y, label='Simulated Data')
plt.plot(x_range, y_pred, label='Regression Line', color='red')

# Apply the axis labels and title, then add the legend and render
for set_text, text in ((plt.xlabel, 'X'),
                       (plt.ylabel, 'Y'),
                       (plt.title, 'Linear Regression')):
    set_text(text)
plt.legend()
plt.show()

Covariance matrix

Author: Arun Kumar Pandey

Mathematical Formulation

Importance of covariance matrix