{
"cells": [
{
"cell_type": "code",
"execution_count": 1,
"metadata": {
"collapsed": true
},
"outputs": [],
"source": [
"import pandas as pd"
]
},
{
"cell_type": "code",
"execution_count": 2,
"metadata": {
"collapsed": true
},
"outputs": [],
"source": [
"d = {'AÑO': [2001, 2003, 2003, 2001],\n",
" 'SEXO': ['MASCULINO', 'FEMENINO', 'FEMENINO', 'FEMENINO'],\n",
" 'GENERO MUSICAL': ['BACHATA, SALSA', 'POP, SALSA', 'POP', 'POP, COUNTRY']}"
]
},
{
"cell_type": "code",
"execution_count": 3,
"metadata": {
"collapsed": false
},
"outputs": [
{
"data": {
"text/html": [
"
\n",
"
\n",
" \n",
" \n",
" | \n",
" AÑO | \n",
" GENERO MUSICAL | \n",
" SEXO | \n",
"
\n",
" \n",
" \n",
" \n",
" 0 | \n",
" 2001 | \n",
" BACHATA, SALSA | \n",
" MASCULINO | \n",
"
\n",
" \n",
" 1 | \n",
" 2003 | \n",
" POP, SALSA | \n",
" FEMENINO | \n",
"
\n",
" \n",
" 2 | \n",
" 2003 | \n",
" POP | \n",
" FEMENINO | \n",
"
\n",
" \n",
" 3 | \n",
" 2001 | \n",
" POP, COUNTRY | \n",
" FEMENINO | \n",
"
\n",
" \n",
"
\n",
"
"
],
"text/plain": [
" AÑO GENERO MUSICAL SEXO\n",
"0 2001 BACHATA, SALSA MASCULINO\n",
"1 2003 POP, SALSA FEMENINO\n",
"2 2003 POP FEMENINO\n",
"3 2001 POP, COUNTRY FEMENINO"
]
},
"execution_count": 3,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"genero_data = pd.DataFrame(d)\n",
"genero_data"
]
},
{
"cell_type": "code",
"execution_count": 4,
"metadata": {
"collapsed": false
},
"outputs": [
{
"data": {
"text/plain": [
"POP 3\n",
" SALSA 2\n",
"BACHATA 1\n",
" COUNTRY 1\n",
"Name: GENERO, dtype: int64"
]
},
"execution_count": 4,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"musica = genero_data['GENERO MUSICAL'].str.split(',').apply(pd.Series, 1).stack()\n",
"musica.index = musica.index.droplevel(-1)\n",
"musica.name='GENERO'\n",
"pd.value_counts(musica)"
]
},
{
"cell_type": "code",
"execution_count": 5,
"metadata": {
"collapsed": false
},
"outputs": [
{
"data": {
"text/html": [
"\n",
"
\n",
" \n",
" \n",
" | \n",
" AÑO | \n",
" SEXO | \n",
" GENERO | \n",
"
\n",
" \n",
" \n",
" \n",
" 0 | \n",
" 2001 | \n",
" MASCULINO | \n",
" BACHATA | \n",
"
\n",
" \n",
" 0 | \n",
" 2001 | \n",
" MASCULINO | \n",
" SALSA | \n",
"
\n",
" \n",
" 1 | \n",
" 2003 | \n",
" FEMENINO | \n",
" POP | \n",
"
\n",
" \n",
" 1 | \n",
" 2003 | \n",
" FEMENINO | \n",
" SALSA | \n",
"
\n",
" \n",
" 2 | \n",
" 2003 | \n",
" FEMENINO | \n",
" POP | \n",
"
\n",
" \n",
" 3 | \n",
" 2001 | \n",
" FEMENINO | \n",
" POP | \n",
"
\n",
" \n",
" 3 | \n",
" 2001 | \n",
" FEMENINO | \n",
" COUNTRY | \n",
"
\n",
" \n",
"
\n",
"
"
],
"text/plain": [
" AÑO SEXO GENERO\n",
"0 2001 MASCULINO BACHATA\n",
"0 2001 MASCULINO SALSA\n",
"1 2003 FEMENINO POP\n",
"1 2003 FEMENINO SALSA\n",
"2 2003 FEMENINO POP\n",
"3 2001 FEMENINO POP\n",
"3 2001 FEMENINO COUNTRY"
]
},
"execution_count": 5,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"del genero_data['GENERO MUSICAL']\n",
"genero_data = genero_data.join(musica)\n",
"genero_data"
]
},
{
"cell_type": "code",
"execution_count": 6,
"metadata": {
"collapsed": false
},
"outputs": [
{
"data": {
"text/plain": [
"POP 3\n",
" SALSA 2\n",
"BACHATA 1\n",
" COUNTRY 1\n",
"Name: GENERO, dtype: int64"
]
},
"execution_count": 6,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"pd.value_counts(genero_data['GENERO'])"
]
}
],
"metadata": {
"kernelspec": {
"display_name": "Python 3",
"language": "python",
"name": "python3"
},
"language_info": {
"codemirror_mode": {
"name": "ipython",
"version": 3
},
"file_extension": ".py",
"mimetype": "text/x-python",
"name": "python",
"nbconvert_exporter": "python",
"pygments_lexer": "ipython3",
"version": "3.5.2"
}
},
"nbformat": 4,
"nbformat_minor": 0
}