Answered step by step

Verified Expert Solution

Link Copied!

Question

1 Approved Answer

Posted on Aug 28, 2024

# A klay c dosya olan 'agaricus - lepiota.names' dosyas n okuyarak i eri ine bak yoruz . file _ path = 'agaricus - lepiota.names'

# Açıklayıcı dosya olan 'agaricus-lepiota.names' dosyasını okuyarak içeriğine bakıyoruz.

file

_

path

=

'agaricus

-

lepiota.names'

# Dosyanın içeriğini okuma

with open

(

file

_

path,

'

')

as file:

names

_

content

=

file.read

()

eri

in ilk

10000

karakterini g

stermek i

in k

saltma yaparak i

eri

i g

sterelim

(

names

_

content

[

10000])

10000

karakteri g

steriyoruz

.

% %

import pandas as pd

# Veri setini okuyarak DataFrame oluşturma

data

_

file

_

path

=

'agaricus

-

lepiota.data.csv

'

column

_

names

= ['

class

',

'cap

-

shape', 'cap

-

surface', 'cap

-

color', 'bruises', 'odor',

'gill

-

attachment', 'gill

-

spacing', 'gill

-

size', 'gill

-

color',

'stalk

-

shape', 'stalk

-

root', 'stalk

-

surface

-

above

-

ring',

'stalk

-

surface

-

below

-

ring', 'stalk

-

color

-

above

-

ring',

'stalk

-

color

-

below

-

ring', 'veil

-

type', 'veil

-

color', 'ring

-

number',

'ring

-

type', 'spore

-

-

color', 'population', 'habitat'

]

mushroom

_

data

=

.

read

_

csv

(

data

_

file

_

path, header

=

None, names

=

column

_

names

)

5

sat

stererek veri yap

inceleyelim

mushroom

_

data.head

()

% %

(

mushroom

_

data.describe

())

% %

mushroom

_

data.info

()

# All features are categorical but are stored with the 'object' dtype, so they are first converted to the 'category' dtype.

% %

from plotly.subplots import make

_

subplots

import plotly.graph

_

objects as go

specs

= [[{'

type

'

:'domain'

}, {'

type

'

:'domain'

}, {'

type

'

:'domain'

}, {'

type

'

:'domain'

}, {'

type

'

:'domain'

}], [{'

type

'

:'domain'

}, {'

type

'

:'domain'

}, {'

type

'

:'domain'

}, {'

type

'

:'domain'

}, {'

type

'

:'domain'

}], [{'

type

'

:'domain'

}, {'

type

'

:'domain'

}, {'

type

'

:'domain'

}, {'

type

'

:'domain'

}, {'

type

'

:'domain'

}], [{'

type

'

:'domain'

}, {'

type

'

:'domain'

}, {'

type

'

:'domain'

}, {'

type

'

:'domain'

}, {'

type

'

:'domain'

}], [{'

type

'

:'domain'

}, {'

type

'

:'domain'

}, {'

type

'

:'domain'

}, {'

type

'

:'domain'

}, {'

type

'

:'domain'

}]]

fig

=

make

_

subplots

(

rows

= 5,

cols

= 5,

specs

=

specs

)

= 1

= 1

= - 0.172

= 1.267

= []

for col in mushroom

_

data.columns:

fig.add

_

trace

(

.

Pie

(

labels

= [

n for n in mushroom

_

data

[

col

] .

value

_

counts

() .

index

],

values

= [

v for v in mushroom

_

data

[

col

] .

value

_

counts

() * 100 /

sum

(

mushroom

_

data

[

col

] .

value

_

counts

())],

name

=

col

),

,

)

.

append

(

dict

(

text

=

col, x

=

+ (0.225 *

),

=

- (0.222 *

),

font

_

size

= 10,

showarrow

=

False

))

+ = 1

if a

> 5

= 1

+ = 1

fig.update

(

layout

_

title

_

text

=

'Features',

layout

_

showlegend

=

False

)

fig.update

_

layout

(

title

_

font

_

family

=

"Arial",

title

_

font

_

size

= 25,

annotations

=

)

fig.update

_

traces

(

hole

= . 4,

hoverinfo

=

"label

+

percent

+

name",textinfo

=

'none'

)

fig.show

()

% %

def make_categorical(mushroom_data, columns):
    """Convert the listed columns of a DataFrame to the categorical dtype.

    Args:
        mushroom_data: DataFrame whose columns are converted. It is
            modified in place.
        columns: Iterable of column labels to convert.

    Returns:
        The same DataFrame object that was passed in, with every listed
        column replaced by a ``pd.Categorical`` built from its values.
    """
    for column in columns:
        # Assigning back under the same label swaps the column's dtype
        # without changing its values.
        mushroom_data[column] = pd.Categorical(mushroom_data[column])
    return mushroom_data

% %

columns

=

mushroom

_

data.columns

data

=

make

_

categorical

(

mushroom

_

data, columns

)

% %

mushroom

_

data.info

()

% %

mushroom

_

data.shape

# There are 8124 observations and 23 features in the mushroom dataset.

% %

mushroom

_

data.isnull

() .

any

()

# There are no missing values in the mushroom dataset.

% %

# Veri türleri incelemesi

data

_

types

=

mushroom

_

data.dtypes

data

_

types

% %

mushroom

_

data

_

habitat

=

mushroom

_

data

['

habitat

'] .

groupby

(

mushroom

_

data

['

class

']) .

value

_

counts

(

normalize

=

True

) .

rename

('

frequency

') .

_

frame

() .

reset

_

index

()

mushroom

_

data

_

habitat

% %

from matplotlib import pyplot as plt

import seaborn as sns

# Let's create a bar plot to show the Habitat Distribution

sns

.

barplot

(

data

=

mushroom

_

data

_

habitat,x

=

'habitat',y

=

'frequency',hue

=

'class'

)

plt

.

xlabel

('

Habitat

')

plt

.

ylabel

('

frequenncy

(%)')

plt

.

title

("

Habitat Distribution: Edible Vs Poisonous"

)

;

% %

mushroom

_

data

_

popu

=

mushroom

_

data

['

population

'] .

groupby

(

mushroom

_

data

['

class

']) .

value

_

counts

(

normalize

=

True

) .

rename

('

frequency

') .

_

frame

() .

reset

_

index

()

mushroom

_

data

_

popu

% %

## Let's create a bar plot to show the population: Edible Vs Poisonous

import plotly.express as px

fig

=

.

bar

(

data

_

frame

=

mushroom

_

data

_

popu

,

=

'population', y

=

'frequency',color

=

'class', barmode

=

'group', title

=

'population: Edible Vs Poisonous'

)

fig.update

_

layout

(

xaxis

_

title

=

'population'

,

yaxis

_

title

=

'frequenncy

(%)')

% %

ring

_

num

= {

'

'

1,

'

'

2,

'

'

0

}

ring

_

num

mushroom

_

data

_

ring

=

mushroom

_

data

['

ring

-

number'

] .

replace

(

ring

_

num

) .

groupby

(

mushroom

_

data

['

class

']) .

value

_

counts

(

normalize

=

True

) .

rename

('

frequency

') .

_

frame

() .

reset

_

index

()

mushroom

_

data

_

ring

% %

# Let's create a bar chart to visualize the number of rings in each class

fig

=

.

bar

(

data

_

frame

=

mushroom

_

data

_

ring

,

=

'ring

-

number'

,

=

'frequency'

,

color

=

'class'

,

barmode

=

'group',title

=

'Number of rings: Edible Vs Poisonous'

)

fig.update

_

layout

(

xaxis

_

title

=

'number of rings'

,

yaxis

_

title

=

'frequency

(%)')

THE PYTHON CODE GIVEN ABOVE IS RELATED TO RANDOM FOREST CLASSIFICATION IN THE DATA SCIENCE COURSE.

PLEASE INTERPRET THIS CODE AND PREPARE A REPORT ACCORDING TO THE SUBJECTS AND CODES.

Step by Step Solution

There are 3 Steps involved in it

Step: 1

Get Instant Access to Expert-Tailored Solutions

See step-by-step solutions with expert insights and AI powered tools for academic success

Step: 2

Step: 3

Ace Your Homework with AI

Get the answers you need in no time with our AI-driven, step-by-step assistance

Get Started

Recommended Textbook for

Practical Database Auditing For Microsoft SQL Server And Azure SQL Troubleshooting Regulatory Compliance And Governance

Authors: Josephine Bush

1st Edition

★★★★★

(Appendices) ENDING INVENTORY AND COST OF GOODS SOLD. Hempstead Company has the following data for 19x9: LO8

Answered: 1 week ago

Previous Question Next Question