2 Sat
TIL
[인프런] 단 두 장의 문서로 데이터 분석과 시각화 뽀개기
일부 컬럼을 기준으로 데이터 가져오기 - Subset Variables (Columns)
import seaborn as sns
df = sns.load_dataset("iris")
df.head()
sepal_length
sepal_width
petal_length
petal_width
species
0
5.1
3.5
1.4
0.2
setosa
1
4.9
3.0
1.4
0.2
setosa
2
4.7
3.2
1.3
0.2
setosa
3
4.6
3.1
1.5
0.2
setosa
4
5.0
3.6
1.4
0.2
setosa
columns = ['sepal_length', 'sepal_width', 'species']
df[columns].head()
sepal_length
sepal_width
species
0
5.1
3.5
setosa
1
4.9
3.0
setosa
2
4.7
3.2
setosa
3
4.6
3.1
setosa
4
5.0
3.6
setosa
df['sepal_width'].head()
0 3.5
1 3.0
2 3.2
3 3.1
4 3.6
Name: sepal_width, dtype: float64
df.sepal_width.head()
0 3.5
1 3.0
2 3.2
3 3.1
4 3.6
Name: sepal_width, dtype: float64
df.filter(regex='regex').head(5)
0
1
2
3
4
현재는 조건('regex'라는 문자열)에 맞는 컬럼이 없어서 인덱스만 추출된다.
df.filter(regex='\.').head(5)
0
1
2
3
4
'.' ์ด ๋ค์ด๊ฐ column์ ์ถ์ถํ๋ค. ์ด ๋๋ '.'์ด ๋ค์ด๊ฐ column์ด ์๋ค. ๋ํ '.'์ ์ ๊ท์์์ ๋ค๋ฅธ ์๋ฏธ๋ก๋ ์ฐ์ด๊ธฐ ๋๋ฌธ์ \. ๋ก ์ฌ์ฉํ๋ค.
df.filter(regex='_').head(5)
sepal_length
sepal_width
petal_length
petal_width
0
5.1
3.5
1.4
0.2
1
4.9
3.0
1.4
0.2
2
4.7
3.2
1.3
0.2
3
4.6
3.1
1.5
0.2
4
5.0
3.6
1.4
0.2
df.filter(regex='length$').head(5)
sepal_length
petal_length
0
5.1
1.4
1
4.9
1.4
2
4.7
1.3
3
4.6
1.5
4
5.0
1.4
$가 뒤에 오면 특정 문자로 끝나는 결과만 추출한다.
df.filter(regex='^sepal').head(5)
sepal_length
sepal_width
0
5.1
3.5
1
4.9
3.0
2
4.7
3.2
3
4.6
3.1
4
5.0
3.6
^가 앞에 오면 특정 문자로 시작하는 결과만 추출한다.
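# 주의: 정규식은 대소문자를 구분한다. 실제 컬럼명은 소문자 'species'이므로 'Species'로는 아무 컬럼도 제외되지 않는다.
# species 컬럼을 제외하려면 regex='^(?!species$).*' 로 써야 한다.
df.filter(regex='^(?!Species$).*').head(5)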
sepal_length
sepal_width
petal_length
petal_width
species
0
5.1
3.5
1.4
0.2
setosa
1
4.9
3.0
1.4
0.2
setosa
2
4.7
3.2
1.3
0.2
setosa
3
4.6
3.1
1.5
0.2
setosa
4
5.0
3.6
1.4
0.2
setosa
loc๋ฅผ ์ด์ฉํด์ ๋ฒ์ ์ค์ ์ ํ ์ ์๋ค.
df.loc[2:5, 'sepal_width':'petal_width']
sepal_width
petal_length
petal_width
2
3.2
1.3
0.2
3
3.1
1.5
0.2
4
3.6
1.4
0.2
5
3.9
1.7
0.4
df.iloc[-5:, [1,2,4]]
sepal_width
petal_length
species
145
3.0
5.2
virginica
146
2.5
5.0
virginica
147
3.0
5.2
virginica
148
3.4
5.4
virginica
149
3.0
5.1
virginica
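# 주의: 닫는 대괄호 위치 때문에 이 식은 (조건으로 필터링된 DataFrame, 컬럼 리스트) 튜플이 된다.
# 조건과 컬럼을 함께 선택하려면 df.loc[df['sepal_length'] > 5, ['sepal_length','sepal_width']] 로 써야 한다.
df.loc[df['sepal_length'] > 5], ['sepal_length','sepal_width']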
( sepal_length sepal_width petal_length petal_width species
0 5.1 3.5 1.4 0.2 setosa
5 5.4 3.9 1.7 0.4 setosa
10 5.4 3.7 1.5 0.2 setosa
14 5.8 4.0 1.2 0.2 setosa
15 5.7 4.4 1.5 0.4 setosa
.. ... ... ... ... ...
145 6.7 3.0 5.2 2.3 virginica
146 6.3 2.5 5.0 1.9 virginica
147 6.5 3.0 5.2 2.0 virginica
148 6.2 3.4 5.4 2.3 virginica
149 5.9 3.0 5.1 1.8 virginica
[118 rows x 5 columns],
['sepal_length', 'sepal_width'])
Last updated
Was this helpful?