\n", " | text | \n", "movie_name | \n", "category_name | \n", "
---|---|---|---|
0 | \n", "A senior at an elite college (Katie Holmes), a... | \n", "abandon | \n", "Plot | \n", "
1 | \n", "Will Lightman is a hip Londoner who one day re... | \n", "about_a_boy | \n", "Plot | \n", "
2 | \n", "Warren Schmidt (Nicholson) is forced to deal w... | \n", "about_schmidt | \n", "Plot | \n", "
3 | \n", "An account of screenwriter Charlie Kaufman's (... | \n", "adaptation | \n", "Plot | \n", "
4 | \n", "Ali G unwittingly becomes a pawn in the evil C... | \n", "ali_g_indahouse | \n", "Plot | \n", "
\n", " | Positive freq | \n", "Negative freq | \n", "pos_precision | \n", "pos_freq_pct | \n", "pos_hmean | \n", "
---|---|---|---|---|---|
term | \n", "\n", " | \n", " | \n", " | \n", " | \n", " |
the | \n", "2346 | \n", "2288 | \n", "0.506258 | \n", "0.048037 | \n", "0.087748 | \n", "
a | \n", "1775 | \n", "1613 | \n", "0.523908 | \n", "0.036345 | \n", "0.067975 | \n", "
and | \n", "1637 | \n", "1179 | \n", "0.581321 | \n", "0.033520 | \n", "0.063385 | \n", "
of | \n", "1480 | \n", "1235 | \n", "0.545120 | \n", "0.030305 | \n", "0.057418 | \n", "
to | \n", "942 | \n", "1010 | \n", "0.482582 | \n", "0.019289 | \n", "0.037095 | \n", "
it | \n", "826 | \n", "801 | \n", "0.507683 | \n", "0.016913 | \n", "0.032736 | \n", "
is | \n", "818 | \n", "726 | \n", "0.529793 | \n", "0.016750 | \n", "0.032473 | \n", "
s | \n", "808 | \n", "749 | \n", "0.518947 | \n", "0.016545 | \n", "0.032067 | \n", "
in | \n", "676 | \n", "622 | \n", "0.520801 | \n", "0.013842 | \n", "0.026967 | \n", "
that | \n", "617 | \n", "602 | \n", "0.506153 | \n", "0.012634 | \n", "0.024652 | \n", "
\n", " | Positive freq | \n", "Negative freq | \n", "pos_precision | \n", "pos_freq_pct | \n", "pos_hmean | \n", "pos_precision_normcdf | \n", "pos_freq_pct_normcdf | \n", "pos_scaled_f_score | \n", "
---|---|---|---|---|---|---|---|---|
term | \n", "\n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " |
best | \n", "108 | \n", "36 | \n", "0.750000 | \n", "0.002211 | \n", "0.004410 | \n", "0.719483 | \n", "0.995008 | \n", "0.835107 | \n", "
entertaining | \n", "58 | \n", "13 | \n", "0.816901 | \n", "0.001188 | \n", "0.002372 | \n", "0.770690 | \n", "0.909394 | \n", "0.834316 | \n", "
fun | \n", "73 | \n", "26 | \n", "0.737374 | \n", "0.001495 | \n", "0.002983 | \n", "0.709233 | \n", "0.956259 | \n", "0.814427 | \n", "
heart | \n", "45 | \n", "11 | \n", "0.803571 | \n", "0.000921 | \n", "0.001841 | \n", "0.760924 | \n", "0.844900 | \n", "0.800716 | \n", "
great | \n", "61 | \n", "23 | \n", "0.726190 | \n", "0.001249 | \n", "0.002494 | \n", "0.700011 | \n", "0.920936 | \n", "0.795418 | \n", "
still | \n", "63 | \n", "26 | \n", "0.707865 | \n", "0.001290 | \n", "0.002575 | \n", "0.684620 | \n", "0.927988 | \n", "0.787940 | \n", "
our | \n", "42 | \n", "11 | \n", "0.792453 | \n", "0.000860 | \n", "0.001718 | \n", "0.752608 | \n", "0.826505 | \n", "0.787827 | \n", "
performance | \n", "53 | \n", "19 | \n", "0.736111 | \n", "0.001085 | \n", "0.002167 | \n", "0.708199 | \n", "0.887454 | \n", "0.787758 | \n", "
love | \n", "61 | \n", "25 | \n", "0.709302 | \n", "0.001249 | \n", "0.002494 | \n", "0.685839 | \n", "0.920936 | \n", "0.786188 | \n", "
both | \n", "52 | \n", "19 | \n", "0.732394 | \n", "0.001065 | \n", "0.002126 | \n", "0.705143 | \n", "0.882645 | \n", "0.783972 | \n", "
\n", " | Positive freq | \n", "Negative freq | \n", "pos_precision | \n", "pos_freq_pct | \n", "pos_hmean | \n", "pos_precision_normcdf | \n", "pos_freq_pct_normcdf | \n", "pos_scaled_f_score | \n", "
---|---|---|---|---|---|---|---|---|
term | \n", "\n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " |
brawny | \n", "0 | \n", "1 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.113086 | \n", "0.459931 | \n", "0.181537 | \n", "
derivativeness | \n", "0 | \n", "1 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.113086 | \n", "0.459931 | \n", "0.181537 | \n", "
blatant | \n", "0 | \n", "1 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.113086 | \n", "0.459931 | \n", "0.181537 | \n", "
jams | \n", "0 | \n", "1 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.113086 | \n", "0.459931 | \n", "0.181537 | \n", "
staleness | \n", "0 | \n", "1 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.113086 | \n", "0.459931 | \n", "0.181537 | \n", "
luck | \n", "0 | \n", "2 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.113086 | \n", "0.459931 | \n", "0.181537 | \n", "
screenplays | \n", "0 | \n", "2 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.113086 | \n", "0.459931 | \n", "0.181537 | \n", "
tripe | \n", "0 | \n", "1 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.113086 | \n", "0.459931 | \n", "0.181537 | \n", "
lackluster | \n", "0 | \n", "6 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.113086 | \n", "0.459931 | \n", "0.181537 | \n", "
stoop | \n", "0 | \n", "1 | \n", "0.0 | \n", "0.0 | \n", "0.0 | \n", "0.113086 | \n", "0.459931 | \n", "0.181537 | \n", "
\n", " | Positive freq | \n", "Negative freq | \n", "pos_precision | \n", "pos_freq_pct | \n", "pos_hmean | \n", "pos_precision_normcdf | \n", "pos_freq_pct_normcdf | \n", "pos_scaled_f_score | \n", "neg_precision_normcdf | \n", "neg_freq_pct_normcdf | \n", "neg_scaled_f_score | \n", "scaled_f_score | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|
term | \n", "\n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " |
best | \n", "108 | \n", "36 | \n", "0.750000 | \n", "0.002211 | \n", "0.004410 | \n", "0.719483 | \n", "0.995008 | \n", "0.835107 | \n", "0.280517 | \n", "0.805491 | \n", "0.416118 | \n", "0.670214 | \n", "
entertaining | \n", "58 | \n", "13 | \n", "0.816901 | \n", "0.001188 | \n", "0.002372 | \n", "0.770690 | \n", "0.909394 | \n", "0.834316 | \n", "0.229310 | \n", "0.596336 | \n", "0.331246 | \n", "0.668633 | \n", "
fun | \n", "73 | \n", "26 | \n", "0.737374 | \n", "0.001495 | \n", "0.002983 | \n", "0.709233 | \n", "0.956259 | \n", "0.814427 | \n", "0.290767 | \n", "0.723380 | \n", "0.414801 | \n", "0.628854 | \n", "
heart | \n", "45 | \n", "11 | \n", "0.803571 | \n", "0.000921 | \n", "0.001841 | \n", "0.760924 | \n", "0.844900 | \n", "0.800716 | \n", "0.239076 | \n", "0.575415 | \n", "0.337801 | \n", "0.601433 | \n", "
great | \n", "61 | \n", "23 | \n", "0.726190 | \n", "0.001249 | \n", "0.002494 | \n", "0.700011 | \n", "0.920936 | \n", "0.795418 | \n", "0.299989 | \n", "0.695802 | \n", "0.419230 | \n", "0.590836 | \n", "
still | \n", "63 | \n", "26 | \n", "0.707865 | \n", "0.001290 | \n", "0.002575 | \n", "0.684620 | \n", "0.927988 | \n", "0.787940 | \n", "0.315380 | \n", "0.723380 | \n", "0.439254 | \n", "0.575880 | \n", "
our | \n", "42 | \n", "11 | \n", "0.792453 | \n", "0.000860 | \n", "0.001718 | \n", "0.752608 | \n", "0.826505 | \n", "0.787827 | \n", "0.247392 | \n", "0.575415 | \n", "0.346019 | \n", "0.575654 | \n", "
performance | \n", "53 | \n", "19 | \n", "0.736111 | \n", "0.001085 | \n", "0.002167 | \n", "0.708199 | \n", "0.887454 | \n", "0.787758 | \n", "0.291801 | \n", "0.657250 | \n", "0.404164 | \n", "0.575515 | \n", "
love | \n", "61 | \n", "25 | \n", "0.709302 | \n", "0.001249 | \n", "0.002494 | \n", "0.685839 | \n", "0.920936 | \n", "0.786188 | \n", "0.314161 | \n", "0.714324 | \n", "0.436395 | \n", "0.572376 | \n", "
both | \n", "52 | \n", "19 | \n", "0.732394 | \n", "0.001065 | \n", "0.002126 | \n", "0.705143 | \n", "0.882645 | \n", "0.783972 | \n", "0.294857 | \n", "0.657250 | \n", "0.407086 | \n", "0.567945 | \n", "
\n", " | Positive freq | \n", "Negative freq | \n", "pos_precision | \n", "pos_freq_pct | \n", "pos_hmean | \n", "pos_precision_normcdf | \n", "pos_freq_pct_normcdf | \n", "pos_scaled_f_score | \n", "neg_precision_normcdf | \n", "neg_freq_pct_normcdf | \n", "neg_scaled_f_score | \n", "scaled_f_score | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|
term | \n", "\n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " | \n", " |
bad | \n", "17 | \n", "105 | \n", "0.139344 | \n", "0.000348 | \n", "0.000694 | \n", "0.190130 | \n", "0.625807 | \n", "0.291652 | \n", "0.809870 | \n", "0.996676 | \n", "0.893614 | \n", "-0.787229 | \n", "
too | \n", "42 | \n", "147 | \n", "0.222222 | \n", "0.000860 | \n", "0.001713 | \n", "0.248430 | \n", "0.826505 | \n", "0.382030 | \n", "0.751570 | \n", "0.999939 | \n", "0.858145 | \n", "-0.716289 | \n", "
were | \n", "14 | \n", "50 | \n", "0.218750 | \n", "0.000287 | \n", "0.000573 | \n", "0.245811 | \n", "0.597317 | \n", "0.348291 | \n", "0.754189 | \n", "0.892009 | \n", "0.817330 | \n", "-0.634660 | \n", "
only | \n", "43 | \n", "100 | \n", "0.300699 | \n", "0.000880 | \n", "0.001756 | \n", "0.311369 | \n", "0.832785 | \n", "0.453267 | \n", "0.688631 | \n", "0.995056 | \n", "0.813959 | \n", "-0.627919 | \n", "
would | \n", "33 | \n", "72 | \n", "0.314286 | \n", "0.000676 | \n", "0.001349 | \n", "0.322931 | \n", "0.763424 | \n", "0.453872 | \n", "0.677069 | \n", "0.966222 | \n", "0.796206 | \n", "-0.592412 | \n", "
no | \n", "65 | \n", "130 | \n", "0.333333 | \n", "0.001331 | \n", "0.002651 | \n", "0.339430 | \n", "0.934547 | \n", "0.497990 | \n", "0.660570 | \n", "0.999644 | \n", "0.795481 | \n", "-0.590963 | \n", "
just | \n", "76 | \n", "145 | \n", "0.343891 | \n", "0.001556 | \n", "0.003098 | \n", "0.348713 | \n", "0.962723 | \n", "0.511979 | \n", "0.651287 | \n", "0.999924 | \n", "0.788800 | \n", "-0.577600 | \n", "
video | \n", "11 | \n", "39 | \n", "0.220000 | \n", "0.000225 | \n", "0.000450 | \n", "0.246752 | \n", "0.568300 | \n", "0.344099 | \n", "0.753248 | \n", "0.826890 | \n", "0.788353 | \n", "-0.576706 | \n", "
script | \n", "25 | \n", "57 | \n", "0.304878 | \n", "0.000512 | \n", "0.001022 | \n", "0.314906 | \n", "0.698142 | \n", "0.434035 | \n", "0.685094 | \n", "0.922954 | \n", "0.786432 | \n", "-0.572864 | \n", "
should | \n", "27 | \n", "58 | \n", "0.317647 | \n", "0.000553 | \n", "0.001104 | \n", "0.325819 | \n", "0.715199 | \n", "0.447687 | \n", "0.674181 | \n", "0.926760 | \n", "0.780546 | \n", "-0.561092 | \n", "