{ "cells": [ { "cell_type": "code", "execution_count": 1, "metadata": { "collapsed": true }, "outputs": [], "source": [ "import pandas as pd" ] }, { "cell_type": "code", "execution_count": 2, "metadata": { "collapsed": true }, "outputs": [], "source": [ "d = {'AÑO': [2001, 2003, 2003, 2001],\n", " 'SEXO': ['MASCULINO', 'FEMENINO', 'FEMENINO', 'FEMENINO'],\n", " 'GENERO MUSICAL': ['BACHATA, SALSA', 'POP, SALSA', 'POP', 'POP, COUNTRY']}" ] }, { "cell_type": "code", "execution_count": 3, "metadata": { "collapsed": false }, "outputs": [ { "data": { "text/html": [ "
\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
AÑOGENERO MUSICALSEXO
02001BACHATA, SALSAMASCULINO
12003POP, SALSAFEMENINO
22003POPFEMENINO
32001POP, COUNTRYFEMENINO
\n", "
" ], "text/plain": [ " AÑO GENERO MUSICAL SEXO\n", "0 2001 BACHATA, SALSA MASCULINO\n", "1 2003 POP, SALSA FEMENINO\n", "2 2003 POP FEMENINO\n", "3 2001 POP, COUNTRY FEMENINO" ] }, "execution_count": 3, "metadata": {}, "output_type": "execute_result" } ], "source": [ "genero_data = pd.DataFrame(d)\n", "genero_data" ] }, { "cell_type": "code", "execution_count": 4, "metadata": { "collapsed": false }, "outputs": [ { "data": { "text/plain": [ "POP 3\n", " SALSA 2\n", "BACHATA 1\n", " COUNTRY 1\n", "Name: GENERO, dtype: int64" ] }, "execution_count": 4, "metadata": {}, "output_type": "execute_result" } ], "source": [ "musica = genero_data['GENERO MUSICAL'].str.split(',').apply(pd.Series, 1).stack()\n", "musica.index = musica.index.droplevel(-1)\n", "musica.name='GENERO'\n", "pd.value_counts(musica)" ] }, { "cell_type": "code", "execution_count": 5, "metadata": { "collapsed": false }, "outputs": [ { "data": { "text/html": [ "
\n", "\n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", " \n", "
AÑOSEXOGENERO
02001MASCULINOBACHATA
02001MASCULINOSALSA
12003FEMENINOPOP
12003FEMENINOSALSA
22003FEMENINOPOP
32001FEMENINOPOP
32001FEMENINOCOUNTRY
\n", "
" ], "text/plain": [ " AÑO SEXO GENERO\n", "0 2001 MASCULINO BACHATA\n", "0 2001 MASCULINO SALSA\n", "1 2003 FEMENINO POP\n", "1 2003 FEMENINO SALSA\n", "2 2003 FEMENINO POP\n", "3 2001 FEMENINO POP\n", "3 2001 FEMENINO COUNTRY" ] }, "execution_count": 5, "metadata": {}, "output_type": "execute_result" } ], "source": [ "del genero_data['GENERO MUSICAL']\n", "genero_data = genero_data.join(musica)\n", "genero_data" ] }, { "cell_type": "code", "execution_count": 6, "metadata": { "collapsed": false }, "outputs": [ { "data": { "text/plain": [ "POP 3\n", " SALSA 2\n", "BACHATA 1\n", " COUNTRY 1\n", "Name: GENERO, dtype: int64" ] }, "execution_count": 6, "metadata": {}, "output_type": "execute_result" } ], "source": [ "pd.value_counts(genero_data['GENERO'])" ] } ], "metadata": { "kernelspec": { "display_name": "Python 3", "language": "python", "name": "python3" }, "language_info": { "codemirror_mode": { "name": "ipython", "version": 3 }, "file_extension": ".py", "mimetype": "text/x-python", "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", "version": "3.5.2" } }, "nbformat": 4, "nbformat_minor": 0 }