
Question

1 Approved Answer


Code1:
import numpy as np
import pandas as pd
from PIL import Image
from sklearn.preprocessing import StandardScaler
# Initialize dataframe
df = pd.DataFrame(np.zeros((400,2576)))
count = 0
# Load the 400 ORL face images (40 subjects x 10 images each) into the dataframe
for i in range(40):
    for j in range(10):
        image = Image.open("/Users/ORL_Faces/" + str(i+1) + "_" + str(j+1) + ".png")
        image_array = np.array(image).reshape(-1)  # flatten to a 1-D vector of pixel values (2576 per image)
        df.iloc[count] = image_array
        count += 1
# Add gender labels to the dataframe (1 = male, 0 = female)
df["Gender"] = np.ones(400)
# Rows 0-9, 70-79, 90-99 and 310-319 (subjects 1, 8, 10 and 32) are labeled female;
# column position 2576 is the Gender column (pixel columns occupy positions 0-2575)
df.iloc[0:10, 2576] = 0.0
df.iloc[70:80, 2576] = 0.0
df.iloc[90:100, 2576] = 0.0
df.iloc[310:320, 2576] = 0.0
from sklearn.cluster import KMeans
# Standardize image data
X = df.iloc[:,0:2576]
scaler = StandardScaler()
X = scaler.fit_transform(X)
# Apply KMeans clustering with 2 clusters (n_init set explicitly for consistent behavior across sklearn versions)
kmeans_model = KMeans(n_clusters=2, n_init=10, random_state=42)
kmeans_model.fit(X)
# Add cluster labels to the dataframe
df["KMeans_Clusters"] = kmeans_model.labels_
from sklearn.cluster import AgglomerativeClustering
# Reuse the pixel columns (excluding the Gender label) for hierarchical clustering
X = df.iloc[:, 0:2576]
# Standardize image data for hierarchical clustering
scaler = StandardScaler()
X_scaled = scaler.fit_transform(X)
# Apply Hierarchical clustering using Ward's method
hierarchical_cluster = AgglomerativeClustering(n_clusters=2, linkage='ward')
hierarchical_cluster.fit(X_scaled)
# Add cluster labels to the dataframe
df["Hierarchical_Clusters"]= hierarchical_cluster.labels_
# Calculate true and false labelings for K-Means clustering
true_label_kmeans = sum(df["KMeans_Clusters"]== df["Gender"])
false_label_kmeans = sum(df["KMeans_Clusters"]!= df["Gender"])
# Calculate true and false labelings for Hierarchical clustering
true_label_hierarchical = sum(df["Hierarchical_Clusters"]== df["Gender"])
false_label_hierarchical = sum(df["Hierarchical_Clusters"]!= df["Gender"])
import matplotlib.pyplot as plt
plt.figure(figsize=(10,5))
plt.subplot(1,2,1)
plt.scatter(true_label_kmeans, false_label_kmeans, color='blue')
plt.title('K-Means Clustering')
plt.xlabel('True Labels')
plt.ylabel('False Labels')
plt.subplot(1,2,2)
plt.scatter(true_label_hierarchical, false_label_hierarchical, color='red')
plt.title('Hierarchical Clustering')
plt.xlabel('True Labels')
plt.ylabel('False Labels')
plt.tight_layout()
plt.show()
print("K-Means Clustering Results:")
print("# of True Labeling:", true_label_kmeans)
print("# of False Labeling:", false_label_kmeans)
print("
Hierarchical Clustering Results:")
print("# of True Labeling:", true_label_hierarchical)
print("# of False Labeling:", false_label_hierarchical)
Code2:
import numpy as np
import matplotlib.pyplot as plt
from sklearn.datasets import fetch_olivetti_faces, load_digits
from sklearn.cluster import KMeans, AgglomerativeClustering
from sklearn.metrics import silhouette_score
try:
    # Try to fetch the Olivetti faces dataset
    data = fetch_olivetti_faces()
    X = data.data
    y = data.target
    dataset_name = "Olivetti Faces"
except Exception as e:
    print("Failed to fetch Olivetti Faces dataset:", e)
    # Fall back to a different dataset, e.g., load_digits
    data = load_digits()
    X = data.data
    y = data.target
    dataset_name = "Digits"
# Apply k-means clustering (n_init set explicitly for consistent behavior across sklearn versions)
kmeans = KMeans(n_clusters=2, n_init=10, random_state=42)
kmeans_labels = kmeans.fit_predict(X)
# Apply hierarchical clustering
hierarchical = AgglomerativeClustering(n_clusters=2)
hierarchical_labels = hierarchical.fit_predict(X)
# Evaluate clustering performance using silhouette score
kmeans_score = silhouette_score(X, kmeans_labels)
hierarchical_score = silhouette_score(X, hierarchical_labels)
# Print the silhouette scores
print(f"Silhouette Score for K-Means on {dataset_name}:", kmeans_score)
print(f"Silhouette Score for Hierarchical Clustering on {dataset_name}:", hierarchical_score)
# Visualize the clustering results using the first two features (raw pixel values)
plt.figure(figsize=(12,6))
plt.subplot(1,2,1)
plt.scatter(X[:,0], X[:,1], c=kmeans_labels, cmap='viridis', s=10)
plt.title(f"K-Means Clustering on {dataset_name}")
plt.xlabel("Feature 1")
plt.ylabel("Feature 2")
plt.subplot(1,2,2)
plt.scatter(X[:,0], X[:,1], c=hierarchical_labels, cmap='viridis', s=10)
plt.title(f"Hierarchical Clustering on {dataset_name}")
plt.xlabel("Feature 1")
plt.ylabel("Feature 2")
plt.tight_layout()
plt.show()
Please use the dataset of Code1 (the link) for Code2, combine the two codes, and give me the complete code. Thank you! :)
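
For reference, below is a minimal sketch of how the two snippets could be combined: load the ORL images and gender labels as in Code1, then cluster and score them as in Code2. The /Users/ORL_Faces/ path, the 2576-pixel image size, and the female-subject rows are carried over from Code1 as given, not verified here.

import numpy as np
import pandas as pd
from PIL import Image
from sklearn.preprocessing import StandardScaler
from sklearn.cluster import KMeans, AgglomerativeClustering
from sklearn.metrics import silhouette_score

# --- Load the ORL face images as in Code1 (path and image size assumed from Code1) ---
df = pd.DataFrame(np.zeros((400, 2576)))
count = 0
for i in range(40):
    for j in range(10):
        image = Image.open("/Users/ORL_Faces/" + str(i+1) + "_" + str(j+1) + ".png")
        df.iloc[count] = np.array(image).reshape(-1)
        count += 1

# Gender labels as in Code1 (rows 0-9, 70-79, 90-99, 310-319 are female)
gender = np.ones(400)
for start, stop in [(0, 10), (70, 80), (90, 100), (310, 320)]:
    gender[start:stop] = 0.0

# --- Standardize and cluster, then evaluate as in Code2 ---
X = StandardScaler().fit_transform(df.values)
kmeans_labels = KMeans(n_clusters=2, n_init=10, random_state=42).fit_predict(X)
hierarchical_labels = AgglomerativeClustering(n_clusters=2, linkage="ward").fit_predict(X)

# Silhouette scores on the standardized pixel data
print("Silhouette (K-Means):", silhouette_score(X, kmeans_labels))
print("Silhouette (Ward):", silhouette_score(X, hierarchical_labels))

# True/false labelings against the gender labels, as in Code1
for name, labels in [("K-Means", kmeans_labels), ("Hierarchical", hierarchical_labels)]:
    matches = int((labels == gender).sum())
    print(name, "- # of True Labeling:", matches, ", # of False Labeling:", 400 - matches)

The plotting from Code2 can be appended unchanged, since it only needs X, kmeans_labels, and hierarchical_labels; the count-based plots from Code1 would use the match counts computed in the loop above.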
