diff --git a/python_project_1.ipynb b/python_project_1.ipynb new file mode 100644 index 0000000..1e1f4ec --- /dev/null +++ b/python_project_1.ipynb @@ -0,0 +1,923 @@ +{ + "cells": [ + { + "cell_type": "code", + "execution_count": 3, + "id": "7acc26cb", + "metadata": {}, + "outputs": [], + "source": [ + "import pandas as pd" + ] + }, + { + "cell_type": "code", + "execution_count": 4, + "id": "c821dd0a", + "metadata": {}, + "outputs": [], + "source": [ + "df = pd.read_csv('https://raw.githubusercontent.com/CunyLaguardiaDataAnalytics/datasets/master/2014-15_To_2016-17_School-_Level_NYC_Regents_Report_For_All_Variables.csv')" + ] + }, + { + "cell_type": "code", + "execution_count": 71, + "id": "e080ce64", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "(212331, 15)" + ] + }, + "execution_count": 71, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df.shape" + ] + }, + { + "cell_type": "code", + "execution_count": 45, + "id": "57651a37", + "metadata": { + "scrolled": true + }, + "outputs": [ + { + "data": { + "text/plain": [ + "School DBN object\n", + "School Name object\n", + "School Level object\n", + "Regents Exam object\n", + "Year int64\n", + "Total Tested int64\n", + "Mean Score object\n", + "Number Scoring Below 65 object\n", + "Percent Scoring Below 65 object\n", + "Number Scoring 65 or Above object\n", + "Percent Scoring 65 or Above object\n", + "Number Scoring 80 or Above object\n", + "Percent Scoring 80 or Above object\n", + "Number Scoring CR object\n", + "Percent Scoring CR object\n", + "dtype: object" + ] + }, + "execution_count": 45, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df.dtypes" + ] + }, + { + "cell_type": "code", + "execution_count": 63, + "id": "7147a7d1", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2015 2017\n" + ] + } + ], + "source": [ + "# Time range should be 2014-2015 to 2016-2017 school year. Does the 'Year' column reflect this range?\n", + "\n", + "print(df['Year'].min(), df['Year'].max())" + ] + }, + { + "cell_type": "code", + "execution_count": 66, + "id": "897e335b", + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "School DBN 0\n", + "School Name 0\n", + "School Level 0\n", + "Regents Exam 10\n", + "Year 0\n", + "Total Tested 0\n", + "Mean Score 0\n", + "Number Scoring Below 65 0\n", + "Percent Scoring Below 65 0\n", + "Number Scoring 65 or Above 0\n", + "Percent Scoring 65 or Above 0\n", + "Number Scoring 80 or Above 0\n", + "Percent Scoring 80 or Above 0\n", + "Number Scoring CR 0\n", + "Percent Scoring CR 0\n", + "dtype: int64" + ] + }, + "execution_count": 66, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "# Is there any missing data?\n", + "\n", + "df.isna().sum()" + ] + }, + { + "cell_type": "code", + "execution_count": 79, + "id": "e0ab351b", + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + " | School DBN | \n", + "School Name | \n", + "School Level | \n", + "Regents Exam | \n", + "Year | \n", + "Total Tested | \n", + "Mean Score | \n", + "Number Scoring Below 65 | \n", + "Percent Scoring Below 65 | \n", + "Number Scoring 65 or Above | \n", + "Percent Scoring 65 or Above | \n", + "Number Scoring 80 or Above | \n", + "Percent Scoring 80 or Above | \n", + "Number Scoring CR | \n", + "Percent Scoring CR | \n", + "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
18654 | \n", + "84M478 | \n", + "Inwood Academy for Leadership Charter School | \n", + "Secondary School | \n", + "NaN | \n", + "2015 | \n", + "90 | \n", + "55.6 | \n", + "61 | \n", + "67.8 | \n", + "29 | \n", + "32.2 | \n", + "6 | \n", + "6.7 | \n", + "0 | \n", + "0 | \n", + "
52756 | \n", + "84M478 | \n", + "Inwood Academy for Leadership Charter School | \n", + "Secondary School | \n", + "NaN | \n", + "2015 | \n", + "81 | \n", + "55.9 | \n", + "55 | \n", + "67.9 | \n", + "26 | \n", + "32.1 | \n", + "5 | \n", + "6.2 | \n", + "0 | \n", + "0 | \n", + "
52757 | \n", + "84M478 | \n", + "Inwood Academy for Leadership Charter School | \n", + "Secondary School | \n", + "NaN | \n", + "2015 | \n", + "9 | \n", + "53.4 | \n", + "6 | \n", + "66.7 | \n", + "3 | \n", + "33.3 | \n", + "1 | \n", + "11.1 | \n", + "0 | \n", + "0 | \n", + "
100865 | \n", + "84M478 | \n", + "Inwood Academy for Leadership Charter School | \n", + "Secondary School | \n", + "NaN | \n", + "2015 | \n", + "5 | \n", + "s | \n", + "s | \n", + "s | \n", + "s | \n", + "s | \n", + "s | \n", + "s | \n", + "na | \n", + "na | \n", + "
100866 | \n", + "84M478 | \n", + "Inwood Academy for Leadership Charter School | \n", + "Secondary School | \n", + "NaN | \n", + "2015 | \n", + "54 | \n", + "57.4 | \n", + "34 | \n", + "63 | \n", + "20 | \n", + "37 | \n", + "6 | \n", + "11.1 | \n", + "0 | \n", + "0 | \n", + "
100867 | \n", + "84M478 | \n", + "Inwood Academy for Leadership Charter School | \n", + "Secondary School | \n", + "NaN | \n", + "2015 | \n", + "31 | \n", + "s | \n", + "s | \n", + "s | \n", + "s | \n", + "s | \n", + "s | \n", + "s | \n", + "na | \n", + "na | \n", + "
138300 | \n", + "84M478 | \n", + "Inwood Academy for Leadership Charter School | \n", + "Secondary School | \n", + "NaN | \n", + "2015 | \n", + "54 | \n", + "57.3 | \n", + "34 | \n", + "63 | \n", + "20 | \n", + "37 | \n", + "5 | \n", + "9.3 | \n", + "0 | \n", + "0 | \n", + "
138301 | \n", + "84M478 | \n", + "Inwood Academy for Leadership Charter School | \n", + "Secondary School | \n", + "NaN | \n", + "2015 | \n", + "36 | \n", + "53.2 | \n", + "27 | \n", + "75 | \n", + "9 | \n", + "25 | \n", + "1 | \n", + "2.8 | \n", + "0 | \n", + "0 | \n", + "
209785 | \n", + "84M478 | \n", + "Inwood Academy for Leadership Charter School | \n", + "Secondary School | \n", + "NaN | \n", + "2015 | \n", + "12 | \n", + "59 | \n", + "9 | \n", + "75 | \n", + "3 | \n", + "25 | \n", + "1 | \n", + "8.3 | \n", + "0 | \n", + "0 | \n", + "
209786 | \n", + "84M478 | \n", + "Inwood Academy for Leadership Charter School | \n", + "Secondary School | \n", + "NaN | \n", + "2015 | \n", + "78 | \n", + "55.1 | \n", + "52 | \n", + "66.7 | \n", + "26 | \n", + "33.3 | \n", + "5 | \n", + "6.4 | \n", + "0 | \n", + "0 | \n", + "
\n", + " | School DBN | \n", + "School Name | \n", + "School Level | \n", + "Regents Exam | \n", + "Year | \n", + "Total Tested | \n", + "Mean Score | \n", + "Number Scoring Below 65 | \n", + "Percent Scoring Below 65 | \n", + "Number Scoring 65 or Above | \n", + "Percent Scoring 65 or Above | \n", + "Number Scoring 80 or Above | \n", + "Percent Scoring 80 or Above | \n", + "Number Scoring CR | \n", + "Percent Scoring CR | \n", + "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
1 | \n", + "01M034 | \n", + "P.S. 034 Franklin D. Roosevelt | \n", + "K-8 | \n", + "Living Environment | \n", + "2015 | \n", + "16 | \n", + "77.9 | \n", + "1 | \n", + "6.3 | \n", + "15 | \n", + "93.8 | \n", + "7 | \n", + "43.8 | \n", + "na | \n", + "na | \n", + "
2 | \n", + "01M034 | \n", + "P.S. 034 Franklin D. Roosevelt | \n", + "K-8 | \n", + "Living Environment | \n", + "2016 | \n", + "9 | \n", + "74.0 | \n", + "1 | \n", + "11.1 | \n", + "8 | \n", + "88.9 | \n", + "2 | \n", + "22.2 | \n", + "na | \n", + "na | \n", + "
5 | \n", + "01M140 | \n", + "P.S. 140 Nathan Straus | \n", + "K-8 | \n", + "Living Environment | \n", + "2015 | \n", + "9 | \n", + "67.4 | \n", + "3 | \n", + "33.3 | \n", + "6 | \n", + "66.7 | \n", + "0 | \n", + "0.0 | \n", + "na | \n", + "na | \n", + "
6 | \n", + "01M140 | \n", + "P.S. 140 Nathan Straus | \n", + "K-8 | \n", + "Living Environment | \n", + "2016 | \n", + "15 | \n", + "72.6 | \n", + "2 | \n", + "13.3 | \n", + "13 | \n", + "86.7 | \n", + "5 | \n", + "33.3 | \n", + "na | \n", + "na | \n", + "
7 | \n", + "01M140 | \n", + "P.S. 140 Nathan Straus | \n", + "K-8 | \n", + "Living Environment | \n", + "2017 | \n", + "9 | \n", + "64.4 | \n", + "5 | \n", + "55.6 | \n", + "4 | \n", + "44.4 | \n", + "1 | \n", + "11.1 | \n", + "na | \n", + "na | \n", + "
... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "... | \n", + "
212321 | \n", + "84X717 | \n", + "Icahn Charter School | \n", + "K-8 | \n", + "Common Core Algebra | \n", + "2016 | \n", + "6 | \n", + "87.2 | \n", + "0 | \n", + "0 | \n", + "6 | \n", + "100 | \n", + "6 | \n", + "100.0 | \n", + "6 | \n", + "100 | \n", + "
212322 | \n", + "84X717 | \n", + "Icahn Charter School | \n", + "K-8 | \n", + "Common Core Algebra | \n", + "2017 | \n", + "6 | \n", + "87.0 | \n", + "0 | \n", + "0 | \n", + "6 | \n", + "100 | \n", + "6 | \n", + "100.0 | \n", + "6 | \n", + "100 | \n", + "
212323 | \n", + "84X717 | \n", + "Icahn Charter School | \n", + "K-8 | \n", + "Common Core Algebra | \n", + "2017 | \n", + "6 | \n", + "88.3 | \n", + "0 | \n", + "0 | \n", + "6 | \n", + "100 | \n", + "5 | \n", + "83.3 | \n", + "6 | \n", + "100 | \n", + "
212324 | \n", + "84X717 | \n", + "Icahn Charter School | \n", + "K-8 | \n", + "Living Environment | \n", + "2015 | \n", + "8 | \n", + "76.5 | \n", + "1 | \n", + "12.5 | \n", + "7 | \n", + "87.5 | \n", + "2 | \n", + "25.0 | \n", + "na | \n", + "na | \n", + "
212325 | \n", + "84X717 | \n", + "Icahn Charter School | \n", + "K-8 | \n", + "Living Environment | \n", + "2015 | \n", + "6 | \n", + "79.8 | \n", + "0 | \n", + "0 | \n", + "6 | \n", + "100 | \n", + "2 | \n", + "33.3 | \n", + "na | \n", + "na | \n", + "
137101 rows × 15 columns
\n", + "