Skip to content

Instantly share code, notes, and snippets.

@Randl
Last active November 23, 2023 13:04
Show Gist options
  • Save Randl/59db1a96b03fb25b13547d66933819a2 to your computer and use it in GitHub Desktop.
Save Randl/59db1a96b03fb25b13547d66933819a2 to your computer and use it in GitHub Desktop.
Display the source blob
Display the rendered blob
Raw
{
"cells": [
{
"cell_type": "code",
"execution_count": 1,
"metadata": {},
"outputs": [],
"source": [
"import pandas as pd\n",
"import numpy as np\n",
"import matplotlib.pyplot as plt"
]
},
{
"cell_type": "code",
"execution_count": 2,
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"-2019.xlsx curr.xlsx sh.ipynb\r\n"
]
}
],
"source": [
"!ls"
]
},
{
"cell_type": "code",
"execution_count": 3,
"metadata": {},
"outputs": [],
"source": [
"# Data source: https://www.odata.org.il/dataset/de74c280-e91f-4771-8c23-eb8bfe885093\n",
"df = pd.read_excel(\n",
"    \"-2019.xlsx\",\n",
"    skiprows=15,  # NOTE(review): presumably a preamble above the header row - confirm\n",
"    usecols=list(range(8)),  # keep only the first eight columns\n",
")\n",
"# Discard the first parsed row (reason not recorded here - TODO confirm);\n",
"# the remaining rows keep their original index labels.\n",
"df = df.drop(index=df.index[0])"
]
},
{
"cell_type": "code",
"execution_count": 4,
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>ממוצע ציון סופי</th>\n",
" <th>מספר נבחנים</th>\n",
" <th>י\"ל</th>\n",
" <th>מחזור סיום</th>\n",
" <th>מקצוע</th>\n",
" <th>ישוב</th>\n",
" <th>שם מוסד</th>\n",
" <th>סמל מוסד</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>1</th>\n",
" <td>72.38</td>\n",
" <td>66.0</td>\n",
" <td>2.0</td>\n",
" <td>2019.0</td>\n",
" <td>אזרחות</td>\n",
" <td>אבו גוש</td>\n",
" <td>מקיף אבו גוש</td>\n",
" <td>148080.0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>2</th>\n",
" <td>75.00</td>\n",
" <td>32.0</td>\n",
" <td>3.0</td>\n",
" <td>2019.0</td>\n",
" <td>אנגלית</td>\n",
" <td>אבו גוש</td>\n",
" <td>מקיף אבו גוש</td>\n",
" <td>148080.0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>3</th>\n",
" <td>74.44</td>\n",
" <td>16.0</td>\n",
" <td>4.0</td>\n",
" <td>2019.0</td>\n",
" <td>אנגלית</td>\n",
" <td>אבו גוש</td>\n",
" <td>מקיף אבו גוש</td>\n",
" <td>148080.0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>4</th>\n",
" <td>81.81</td>\n",
" <td>21.0</td>\n",
" <td>5.0</td>\n",
" <td>2019.0</td>\n",
" <td>אנגלית</td>\n",
" <td>אבו גוש</td>\n",
" <td>מקיף אבו גוש</td>\n",
" <td>148080.0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>5</th>\n",
" <td>77.19</td>\n",
" <td>32.0</td>\n",
" <td>5.0</td>\n",
" <td>2019.0</td>\n",
" <td>ביולוגיה</td>\n",
" <td>אבו גוש</td>\n",
" <td>מקיף אבו גוש</td>\n",
" <td>148080.0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>...</th>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" </tr>\n",
" <tr>\n",
" <th>15188</th>\n",
" <td>82.67</td>\n",
" <td>12.0</td>\n",
" <td>3.0</td>\n",
" <td>2019.0</td>\n",
" <td>יהדות</td>\n",
" <td>תל אביב - יפו</td>\n",
" <td>תיכון בית יעקב תל אב</td>\n",
" <td>714857.0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>15189</th>\n",
" <td>75.54</td>\n",
" <td>13.0</td>\n",
" <td>5.0</td>\n",
" <td>2019.0</td>\n",
" <td>מדע וטכנולוגיה לכל</td>\n",
" <td>תל אביב - יפו</td>\n",
" <td>תיכון בית יעקב תל אב</td>\n",
" <td>714857.0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>15190</th>\n",
" <td>67.18</td>\n",
" <td>11.0</td>\n",
" <td>2.0</td>\n",
" <td>2019.0</td>\n",
" <td>ספרות</td>\n",
" <td>תל אביב - יפו</td>\n",
" <td>תיכון בית יעקב תל אב</td>\n",
" <td>714857.0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>15191</th>\n",
" <td>80.33</td>\n",
" <td>12.0</td>\n",
" <td>5.0</td>\n",
" <td>2019.0</td>\n",
" <td>פסיכולוגיה התפתחותית</td>\n",
" <td>תל אביב - יפו</td>\n",
" <td>תיכון בית יעקב תל אב</td>\n",
" <td>714857.0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>15192</th>\n",
" <td>81.17</td>\n",
" <td>12.0</td>\n",
" <td>3.0</td>\n",
" <td>2019.0</td>\n",
" <td>תנ'ך</td>\n",
" <td>תל אביב - יפו</td>\n",
" <td>תיכון בית יעקב תל אב</td>\n",
" <td>714857.0</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"<p>15192 rows × 8 columns</p>\n",
"</div>"
],
"text/plain": [
" ממוצע ציון סופי מספר נבחנים י\"ל מחזור סיום מקצוע \n",
"1 72.38 66.0 2.0 2019.0 אזרחות \\\n",
"2 75.00 32.0 3.0 2019.0 אנגלית \n",
"3 74.44 16.0 4.0 2019.0 אנגלית \n",
"4 81.81 21.0 5.0 2019.0 אנגלית \n",
"5 77.19 32.0 5.0 2019.0 ביולוגיה \n",
"... ... ... ... ... ... \n",
"15188 82.67 12.0 3.0 2019.0 יהדות \n",
"15189 75.54 13.0 5.0 2019.0 מדע וטכנולוגיה לכל \n",
"15190 67.18 11.0 2.0 2019.0 ספרות \n",
"15191 80.33 12.0 5.0 2019.0 פסיכולוגיה התפתחותית \n",
"15192 81.17 12.0 3.0 2019.0 תנ'ך \n",
"\n",
" ישוב שם מוסד סמל מוסד \n",
"1 אבו גוש מקיף אבו גוש 148080.0 \n",
"2 אבו גוש מקיף אבו גוש 148080.0 \n",
"3 אבו גוש מקיף אבו גוש 148080.0 \n",
"4 אבו גוש מקיף אבו גוש 148080.0 \n",
"5 אבו גוש מקיף אבו גוש 148080.0 \n",
"... ... ... ... \n",
"15188 תל אביב - יפו תיכון בית יעקב תל אב 714857.0 \n",
"15189 תל אביב - יפו תיכון בית יעקב תל אב 714857.0 \n",
"15190 תל אביב - יפו תיכון בית יעקב תל אב 714857.0 \n",
"15191 תל אביב - יפו תיכון בית יעקב תל אב 714857.0 \n",
"15192 תל אביב - יפו תיכון בית יעקב תל אב 714857.0 \n",
"\n",
"[15192 rows x 8 columns]"
]
},
"execution_count": 4,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"df"
]
},
{
"cell_type": "code",
"execution_count": 5,
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>city</th>\n",
" <th>school_id</th>\n",
" <th>school_name</th>\n",
" <th>year</th>\n",
" <th>subject</th>\n",
" <th>credits</th>\n",
" <th>num_of_students</th>\n",
" <th>average</th>\n",
" <th>sum</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>1</th>\n",
" <td>אבו גוש</td>\n",
" <td>148080</td>\n",
" <td>מקיף אבו גוש</td>\n",
" <td>2019</td>\n",
" <td>אזרחות</td>\n",
" <td>2</td>\n",
" <td>66</td>\n",
" <td>72.38</td>\n",
" <td>4777.08</td>\n",
" </tr>\n",
" <tr>\n",
" <th>2</th>\n",
" <td>אבו גוש</td>\n",
" <td>148080</td>\n",
" <td>מקיף אבו גוש</td>\n",
" <td>2019</td>\n",
" <td>אנגלית</td>\n",
" <td>3</td>\n",
" <td>32</td>\n",
" <td>75.00</td>\n",
" <td>2400.00</td>\n",
" </tr>\n",
" <tr>\n",
" <th>3</th>\n",
" <td>אבו גוש</td>\n",
" <td>148080</td>\n",
" <td>מקיף אבו גוש</td>\n",
" <td>2019</td>\n",
" <td>אנגלית</td>\n",
" <td>4</td>\n",
" <td>16</td>\n",
" <td>74.44</td>\n",
" <td>1191.04</td>\n",
" </tr>\n",
" <tr>\n",
" <th>4</th>\n",
" <td>אבו גוש</td>\n",
" <td>148080</td>\n",
" <td>מקיף אבו גוש</td>\n",
" <td>2019</td>\n",
" <td>אנגלית</td>\n",
" <td>5</td>\n",
" <td>21</td>\n",
" <td>81.81</td>\n",
" <td>1718.01</td>\n",
" </tr>\n",
" <tr>\n",
" <th>5</th>\n",
" <td>אבו גוש</td>\n",
" <td>148080</td>\n",
" <td>מקיף אבו גוש</td>\n",
" <td>2019</td>\n",
" <td>ביולוגיה</td>\n",
" <td>5</td>\n",
" <td>32</td>\n",
" <td>77.19</td>\n",
" <td>2470.08</td>\n",
" </tr>\n",
" <tr>\n",
" <th>...</th>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" </tr>\n",
" <tr>\n",
" <th>15188</th>\n",
" <td>תל אביב - יפו</td>\n",
" <td>714857</td>\n",
" <td>תיכון בית יעקב תל אב</td>\n",
" <td>2019</td>\n",
" <td>יהדות</td>\n",
" <td>3</td>\n",
" <td>12</td>\n",
" <td>82.67</td>\n",
" <td>992.04</td>\n",
" </tr>\n",
" <tr>\n",
" <th>15189</th>\n",
" <td>תל אביב - יפו</td>\n",
" <td>714857</td>\n",
" <td>תיכון בית יעקב תל אב</td>\n",
" <td>2019</td>\n",
" <td>מדע וטכנולוגיה לכל</td>\n",
" <td>5</td>\n",
" <td>13</td>\n",
" <td>75.54</td>\n",
" <td>982.02</td>\n",
" </tr>\n",
" <tr>\n",
" <th>15190</th>\n",
" <td>תל אביב - יפו</td>\n",
" <td>714857</td>\n",
" <td>תיכון בית יעקב תל אב</td>\n",
" <td>2019</td>\n",
" <td>ספרות</td>\n",
" <td>2</td>\n",
" <td>11</td>\n",
" <td>67.18</td>\n",
" <td>738.98</td>\n",
" </tr>\n",
" <tr>\n",
" <th>15191</th>\n",
" <td>תל אביב - יפו</td>\n",
" <td>714857</td>\n",
" <td>תיכון בית יעקב תל אב</td>\n",
" <td>2019</td>\n",
" <td>פסיכולוגיה התפתחותית</td>\n",
" <td>5</td>\n",
" <td>12</td>\n",
" <td>80.33</td>\n",
" <td>963.96</td>\n",
" </tr>\n",
" <tr>\n",
" <th>15192</th>\n",
" <td>תל אביב - יפו</td>\n",
" <td>714857</td>\n",
" <td>תיכון בית יעקב תל אב</td>\n",
" <td>2019</td>\n",
" <td>תנ'ך</td>\n",
" <td>3</td>\n",
" <td>12</td>\n",
" <td>81.17</td>\n",
" <td>974.04</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"<p>15192 rows × 9 columns</p>\n",
"</div>"
],
"text/plain": [
" city school_id school_name year \n",
"1 אבו גוש 148080 מקיף אבו גוש 2019 \\\n",
"2 אבו גוש 148080 מקיף אבו גוש 2019 \n",
"3 אבו גוש 148080 מקיף אבו גוש 2019 \n",
"4 אבו גוש 148080 מקיף אבו גוש 2019 \n",
"5 אבו גוש 148080 מקיף אבו גוש 2019 \n",
"... ... ... ... ... \n",
"15188 תל אביב - יפו 714857 תיכון בית יעקב תל אב 2019 \n",
"15189 תל אביב - יפו 714857 תיכון בית יעקב תל אב 2019 \n",
"15190 תל אביב - יפו 714857 תיכון בית יעקב תל אב 2019 \n",
"15191 תל אביב - יפו 714857 תיכון בית יעקב תל אב 2019 \n",
"15192 תל אביב - יפו 714857 תיכון בית יעקב תל אב 2019 \n",
"\n",
" subject credits num_of_students average sum \n",
"1 אזרחות 2 66 72.38 4777.08 \n",
"2 אנגלית 3 32 75.00 2400.00 \n",
"3 אנגלית 4 16 74.44 1191.04 \n",
"4 אנגלית 5 21 81.81 1718.01 \n",
"5 ביולוגיה 5 32 77.19 2470.08 \n",
"... ... ... ... ... ... \n",
"15188 יהדות 3 12 82.67 992.04 \n",
"15189 מדע וטכנולוגיה לכל 5 13 75.54 982.02 \n",
"15190 ספרות 2 11 67.18 738.98 \n",
"15191 פסיכולוגיה התפתחותית 5 12 80.33 963.96 \n",
"15192 תנ'ך 3 12 81.17 974.04 \n",
"\n",
"[15192 rows x 9 columns]"
]
},
"execution_count": 5,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"# Map the Hebrew source headers to English names. The dict order is also the\n",
"# column order of the cleaned frame.\n",
"HEBREW_TO_ENGLISH = {\n",
"    \"ישוב\": \"city\",\n",
"    \"סמל מוסד\": \"school_id\",\n",
"    \"שם מוסד\": \"school_name\",\n",
"    \"מחזור סיום\": \"year\",\n",
"    \"מקצוע\": \"subject\",\n",
"    'י\"ל': \"credits\",\n",
"    \"מספר נבחנים\": \"num_of_students\",\n",
"    \"ממוצע ציון סופי\": \"average\",\n",
"}\n",
"\n",
"df = (\n",
"    # Drop incomplete rows before casting: astype(int) raises on NaN, so a\n",
"    # dropna() placed after the casts could never take effect.\n",
"    df.dropna()\n",
"    # rename() ignores keys that are absent, which keeps this cell re-runnable\n",
"    # on an already-cleaned frame.\n",
"    .rename(columns=HEBREW_TO_ENGLISH)\n",
"    .loc[:, list(HEBREW_TO_ENGLISH.values())]\n",
"    # Trim stray whitespace around the text fields.\n",
"    .assign(\n",
"        city=lambda d: d[\"city\"].str.strip(),\n",
"        school_name=lambda d: d[\"school_name\"].str.strip(),\n",
"        subject=lambda d: d[\"subject\"].str.strip(),\n",
"    )\n",
"    # These columns are parsed as floats (e.g. 148080.0); store them as integers.\n",
"    .astype({\"school_id\": int, \"year\": int, \"credits\": int, \"num_of_students\": int})\n",
"    # Per-row score total: average * examinee count.\n",
"    .assign(sum=lambda d: d[\"average\"] * d[\"num_of_students\"])\n",
")\n",
"df"
]
},
{
"cell_type": "code",
"execution_count": 6,
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"city 15192\n",
"school_id 15192\n",
"school_name 15192\n",
"year 15192\n",
"subject 15192\n",
"credits 15192\n",
"num_of_students 15192\n",
"average 15192\n",
"sum 15192\n",
"dtype: int64"
]
},
"execution_count": 6,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"df.count()"
]
},
{
"cell_type": "code",
"execution_count": 7,
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"1060"
]
},
"execution_count": 7,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"# Number of distinct schools (school_id is an integer column, so there are no NaN to skip).\n",
"df[\"school_id\"].nunique()"
]
},
{
"cell_type": "code",
"execution_count": 8,
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"759247"
]
},
"execution_count": 8,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"# Sum of num_of_students over every row of the cleaned frame.\n",
"df[\"num_of_students\"].sum()"
]
},
{
"cell_type": "code",
"execution_count": 9,
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"array([2019])"
]
},
"execution_count": 9,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"# Distinct values of the year column, in order of first appearance.\n",
"df[\"year\"].unique()"
]
},
{
"cell_type": "code",
"execution_count": 10,
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"array(['אזרחות', 'אנגלית', 'ביולוגיה', \"הסטוריה לבי'ס ערבי\", 'כימיה',\n",
" 'מדעי לימודי הסביבה', 'מערכות תקשוב', 'מתמטיקה',\n",
" \"עברית לבי'ס ערבי\", 'ערבית לערבים', 'הבעה עברית', 'הסטוריה',\n",
" 'מחשבת ישראל וספרות', \"תושבע'פ ותלמוד\", \"תנ'ך\",\n",
" 'למודי ארץ ישראל וארכ', 'תשתיות מחשוב ותקשוב', 'חקלאות',\n",
" 'מדע וטכנולוגיה לכל', 'מחשבת ישראל לבי\"ס דת', 'ספרות', 'עצוב',\n",
" 'פסיכולוגיה התפתחותית', 'מדעי החברה', 'אלקטרוניקה ומחשבים',\n",
" 'מערכות אלקטרוניות', 'גאוגרפיה', 'מדעי המחשב',\n",
" 'מחשבת ישראל לבי\"ס כל', 'מנהל תיירותי', 'ניהול משאבי אנוש',\n",
" \"ערבית לבי'ס יהודי\", 'פיסיקה', 'תאטרון', 'תיירות', 'אמנות שימושית',\n",
" 'אמנות )הקולנוע(', 'ישומים בביוטכנולוגיה', 'מערכות ביוטכנולוגיה',\n",
" 'אומנות', 'תכנון ותכנות מערכות', 'מוסיקה', 'דת האסלם', 'ספרדית',\n",
" 'פילוסופיה', 'תקשורת )בנתיב העיוני', 'בקרת מכונות',\n",
" 'תולדות הערבים והאיסל', 'תקשורת בינלאומית )אנ', 'הפקות בתקשורת',\n",
" 'חנוך גופני', 'תקשורת וחברה', 'מחול', 'מנהל וכלכלה',\n",
" 'טכנולוגיה מוכללת', 'טכנולוגית בנייה', 'מדעי ההנדסה',\n",
" 'ניהול הייצור', 'ניהול ותפעול', 'מערכות חשמל', 'מכניקה הנדסית',\n",
" 'מערכות מכונאות רכב', 'רישומי פעילויות בחינ', 'מערכות פקוד ובקרה',\n",
" 'מדעי הים', 'ניהול מלונאי', 'שווק וקדום מכירות',\n",
" 'תחזוקת מערכות מכניות', 'מכטרוניקה', 'רוסית', \"תושבע'פ לבי'ס כללי\",\n",
" 'מדעי הבריאות', 'מערכות ניהול מידע וי', 'מערכות רפואיות',\n",
" 'אופטיקה יישומית', 'מחשבים ומערכות', 'אדריכלות ועצוב פנים',\n",
" 'צרפתית', 'מערכות תיב\"מ', 'מערכות רכב', 'תכנון הנדסי של מבנים',\n",
" 'אוטו-טק מערכות ממוחש', 'אומניות הבשול המלונא', 'מדעי התזונה',\n",
" 'עיצוב וטיפוח החן', 'עצוב אופנה', 'מערכות תעופה',\n",
" 'טלוויזיה וקולנוע', 'מדעי כדור הארץ', 'יהדות', 'חשבונאות', 'אידיש',\n",
" 'צלום', 'פרסית', 'מידע וידע באינטרנט', 'ניתוח ואיתור מידע די',\n",
" 'גרמנית', 'מדע חישובי', \"הסטוריה לבי'ס דרוזי\", 'עברית לבי\"ס דרוזי',\n",
" 'ערבית לדרוזים', 'ימאות וספינות', 'מורשת דרוזית',\n",
" 'תחזוקת מערכות סלולרי', 'אמהרית', 'איטלקית', 'מחשוב ובקרה',\n",
" 'תרמודינמיקה טכנית'], dtype=object)"
]
},
"execution_count": 10,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"# Every distinct subject name, in order of first appearance.\n",
"df[\"subject\"].unique()"
]
},
{
"cell_type": "code",
"execution_count": 11,
"metadata": {},
"outputs": [],
"source": [
"int_subjects = [\n",
" \"אזרחות\",\n",
" \"אנגלית\",\n",
" \"ביולוגיה\",\n",
" \"כימיה\",\n",
" \"מתמטיקה\",\n",
" \"פיסיקה\",\n",
" \"מדעי המחשב\",\n",
" \"גאוגרפיה\",\n",
" \"הסטוריה\",\n",
" \"חקלאות\",\n",
" \"תנ'ך\",\n",
" \"אומנות\",\n",
" \"פסיכולוגיה\",\n",
"]"
]
},
{
"cell_type": "code",
"execution_count": 12,
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>city</th>\n",
" <th>school_id</th>\n",
" <th>school_name</th>\n",
" <th>year</th>\n",
" <th>subject</th>\n",
" <th>credits</th>\n",
" <th>num_of_students</th>\n",
" <th>average</th>\n",
" <th>sum</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>8156</th>\n",
" <td>פוריידיס</td>\n",
" <td>360800</td>\n",
" <td>מקיף גבעת פרדיס</td>\n",
" <td>2019</td>\n",
" <td>מתמטיקה</td>\n",
" <td>5</td>\n",
" <td>11</td>\n",
" <td>92.64</td>\n",
" <td>1019.04</td>\n",
" </tr>\n",
" <tr>\n",
" <th>4877</th>\n",
" <td>גבעת שמואל</td>\n",
" <td>444620</td>\n",
" <td>אולפנה לבנות</td>\n",
" <td>2019</td>\n",
" <td>מתמטיקה</td>\n",
" <td>5</td>\n",
" <td>31</td>\n",
" <td>92.58</td>\n",
" <td>2869.98</td>\n",
" </tr>\n",
" <tr>\n",
" <th>526</th>\n",
" <td>מודיעין-מכבים-רעות</td>\n",
" <td>165852</td>\n",
" <td>ישיבת בנ\"ע לפיד</td>\n",
" <td>2019</td>\n",
" <td>מתמטיקה</td>\n",
" <td>5</td>\n",
" <td>43</td>\n",
" <td>92.37</td>\n",
" <td>3971.91</td>\n",
" </tr>\n",
" <tr>\n",
" <th>10658</th>\n",
" <td>עראבה</td>\n",
" <td>249284</td>\n",
" <td>מקיף אלבטוף עראבה</td>\n",
" <td>2019</td>\n",
" <td>מתמטיקה</td>\n",
" <td>5</td>\n",
" <td>40</td>\n",
" <td>91.40</td>\n",
" <td>3656.00</td>\n",
" </tr>\n",
" <tr>\n",
" <th>8031</th>\n",
" <td>מעלה עירון</td>\n",
" <td>348359</td>\n",
" <td>מקיף מושריפה</td>\n",
" <td>2019</td>\n",
" <td>מתמטיקה</td>\n",
" <td>5</td>\n",
" <td>11</td>\n",
" <td>91.27</td>\n",
" <td>1003.97</td>\n",
" </tr>\n",
" <tr>\n",
" <th>5650</th>\n",
" <td>לוד</td>\n",
" <td>441196</td>\n",
" <td>עתיד למדעים לוד</td>\n",
" <td>2019</td>\n",
" <td>מתמטיקה</td>\n",
" <td>5</td>\n",
" <td>109</td>\n",
" <td>90.67</td>\n",
" <td>9883.03</td>\n",
" </tr>\n",
" <tr>\n",
" <th>8189</th>\n",
" <td>פרדס חנה-כרכור</td>\n",
" <td>380030</td>\n",
" <td>חקלאי פרדס-חנה</td>\n",
" <td>2019</td>\n",
" <td>מתמטיקה</td>\n",
" <td>5</td>\n",
" <td>29</td>\n",
" <td>90.66</td>\n",
" <td>2629.14</td>\n",
" </tr>\n",
" <tr>\n",
" <th>614</th>\n",
" <td>מודיעין-מכבים-רעות</td>\n",
" <td>450270</td>\n",
" <td>אמי\"ת בנים מודיעין</td>\n",
" <td>2019</td>\n",
" <td>מתמטיקה</td>\n",
" <td>5</td>\n",
" <td>24</td>\n",
" <td>90.50</td>\n",
" <td>2172.00</td>\n",
" </tr>\n",
" <tr>\n",
" <th>9286</th>\n",
" <td>כאוכב אבו אל-היג'א</td>\n",
" <td>372243</td>\n",
" <td>מקיף כאוכב</td>\n",
" <td>2019</td>\n",
" <td>מתמטיקה</td>\n",
" <td>5</td>\n",
" <td>13</td>\n",
" <td>90.31</td>\n",
" <td>1174.03</td>\n",
" </tr>\n",
" <tr>\n",
" <th>9722</th>\n",
" <td>מעיליא</td>\n",
" <td>248823</td>\n",
" <td>נוטרדאם</td>\n",
" <td>2019</td>\n",
" <td>מתמטיקה</td>\n",
" <td>5</td>\n",
" <td>35</td>\n",
" <td>90.09</td>\n",
" <td>3153.15</td>\n",
" </tr>\n",
" <tr>\n",
" <th>15141</th>\n",
" <td>תל אביב - יפו</td>\n",
" <td>540476</td>\n",
" <td>ישיבת הרב עמיאל</td>\n",
" <td>2019</td>\n",
" <td>מתמטיקה</td>\n",
" <td>5</td>\n",
" <td>21</td>\n",
" <td>89.90</td>\n",
" <td>1887.90</td>\n",
" </tr>\n",
" <tr>\n",
" <th>14929</th>\n",
" <td>פתח תקווה</td>\n",
" <td>441204</td>\n",
" <td>ישיבת דרכי נעם</td>\n",
" <td>2019</td>\n",
" <td>מתמטיקה</td>\n",
" <td>5</td>\n",
" <td>17</td>\n",
" <td>89.88</td>\n",
" <td>1527.96</td>\n",
" </tr>\n",
" <tr>\n",
" <th>10318</th>\n",
" <td>סח'נין</td>\n",
" <td>248278</td>\n",
" <td>בית ספר אלבשאאר</td>\n",
" <td>2019</td>\n",
" <td>מתמטיקה</td>\n",
" <td>5</td>\n",
" <td>30</td>\n",
" <td>89.43</td>\n",
" <td>2682.90</td>\n",
" </tr>\n",
" <tr>\n",
" <th>11479</th>\n",
" <td>גדרה</td>\n",
" <td>440834</td>\n",
" <td>אולפנא בהר\"ן</td>\n",
" <td>2019</td>\n",
" <td>מתמטיקה</td>\n",
" <td>5</td>\n",
" <td>28</td>\n",
" <td>89.36</td>\n",
" <td>2502.08</td>\n",
" </tr>\n",
" <tr>\n",
" <th>7278</th>\n",
" <td>ג'ת</td>\n",
" <td>348185</td>\n",
" <td>ביה\"ס גת המשולש</td>\n",
" <td>2019</td>\n",
" <td>מתמטיקה</td>\n",
" <td>5</td>\n",
" <td>38</td>\n",
" <td>89.21</td>\n",
" <td>3389.98</td>\n",
" </tr>\n",
" <tr>\n",
" <th>8802</th>\n",
" <td>דייר אל-אסד</td>\n",
" <td>248302</td>\n",
" <td>תיכון דיר אל-אסד</td>\n",
" <td>2019</td>\n",
" <td>מתמטיקה</td>\n",
" <td>5</td>\n",
" <td>25</td>\n",
" <td>88.88</td>\n",
" <td>2222.00</td>\n",
" </tr>\n",
" <tr>\n",
" <th>4862</th>\n",
" <td>גבעת שמואל</td>\n",
" <td>441634</td>\n",
" <td>ישיבת בנ\"ע ג. שמואל</td>\n",
" <td>2019</td>\n",
" <td>מתמטיקה</td>\n",
" <td>5</td>\n",
" <td>53</td>\n",
" <td>88.85</td>\n",
" <td>4709.05</td>\n",
" </tr>\n",
" <tr>\n",
" <th>11807</th>\n",
" <td>כברי</td>\n",
" <td>260240</td>\n",
" <td>כברי חט\"ע</td>\n",
" <td>2019</td>\n",
" <td>מתמטיקה</td>\n",
" <td>5</td>\n",
" <td>33</td>\n",
" <td>88.70</td>\n",
" <td>2927.10</td>\n",
" </tr>\n",
" <tr>\n",
" <th>807</th>\n",
" <td>עופרה</td>\n",
" <td>140970</td>\n",
" <td>אולפנא עופרה</td>\n",
" <td>2019</td>\n",
" <td>מתמטיקה</td>\n",
" <td>5</td>\n",
" <td>20</td>\n",
" <td>88.65</td>\n",
" <td>1773.00</td>\n",
" </tr>\n",
" <tr>\n",
" <th>12841</th>\n",
" <td>צפריה</td>\n",
" <td>440479</td>\n",
" <td>אולפנה בנ\"ע צפירה</td>\n",
" <td>2019</td>\n",
" <td>מתמטיקה</td>\n",
" <td>5</td>\n",
" <td>36</td>\n",
" <td>88.56</td>\n",
" <td>3188.16</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"</div>"
],
"text/plain": [
" city school_id school_name year subject \n",
"8156 פוריידיס 360800 מקיף גבעת פרדיס 2019 מתמטיקה \\\n",
"4877 גבעת שמואל 444620 אולפנה לבנות 2019 מתמטיקה \n",
"526 מודיעין-מכבים-רעות 165852 ישיבת בנ\"ע לפיד 2019 מתמטיקה \n",
"10658 עראבה 249284 מקיף אלבטוף עראבה 2019 מתמטיקה \n",
"8031 מעלה עירון 348359 מקיף מושריפה 2019 מתמטיקה \n",
"5650 לוד 441196 עתיד למדעים לוד 2019 מתמטיקה \n",
"8189 פרדס חנה-כרכור 380030 חקלאי פרדס-חנה 2019 מתמטיקה \n",
"614 מודיעין-מכבים-רעות 450270 אמי\"ת בנים מודיעין 2019 מתמטיקה \n",
"9286 כאוכב אבו אל-היג'א 372243 מקיף כאוכב 2019 מתמטיקה \n",
"9722 מעיליא 248823 נוטרדאם 2019 מתמטיקה \n",
"15141 תל אביב - יפו 540476 ישיבת הרב עמיאל 2019 מתמטיקה \n",
"14929 פתח תקווה 441204 ישיבת דרכי נעם 2019 מתמטיקה \n",
"10318 סח'נין 248278 בית ספר אלבשאאר 2019 מתמטיקה \n",
"11479 גדרה 440834 אולפנא בהר\"ן 2019 מתמטיקה \n",
"7278 ג'ת 348185 ביה\"ס גת המשולש 2019 מתמטיקה \n",
"8802 דייר אל-אסד 248302 תיכון דיר אל-אסד 2019 מתמטיקה \n",
"4862 גבעת שמואל 441634 ישיבת בנ\"ע ג. שמואל 2019 מתמטיקה \n",
"11807 כברי 260240 כברי חט\"ע 2019 מתמטיקה \n",
"807 עופרה 140970 אולפנא עופרה 2019 מתמטיקה \n",
"12841 צפריה 440479 אולפנה בנ\"ע צפירה 2019 מתמטיקה \n",
"\n",
" credits num_of_students average sum \n",
"8156 5 11 92.64 1019.04 \n",
"4877 5 31 92.58 2869.98 \n",
"526 5 43 92.37 3971.91 \n",
"10658 5 40 91.40 3656.00 \n",
"8031 5 11 91.27 1003.97 \n",
"5650 5 109 90.67 9883.03 \n",
"8189 5 29 90.66 2629.14 \n",
"614 5 24 90.50 2172.00 \n",
"9286 5 13 90.31 1174.03 \n",
"9722 5 35 90.09 3153.15 \n",
"15141 5 21 89.90 1887.90 \n",
"14929 5 17 89.88 1527.96 \n",
"10318 5 30 89.43 2682.90 \n",
"11479 5 28 89.36 2502.08 \n",
"7278 5 38 89.21 3389.98 \n",
"8802 5 25 88.88 2222.00 \n",
"4862 5 53 88.85 4709.05 \n",
"11807 5 33 88.70 2927.10 \n",
"807 5 20 88.65 1773.00 \n",
"12841 5 36 88.56 3188.16 "
]
},
"execution_count": 12,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"# The 20 rows with the highest `average` among 5-credit mathematics entries.\n",
"# c1 / c2 stay as notebook-level masks because later cells reuse them.\n",
"c1 = df[\"subject\"].eq(\"מתמטיקה\")\n",
"c2 = df[\"credits\"].eq(5)\n",
"df.loc[c1 & c2].nlargest(n=20, columns=\"average\")"
]
},
{
"cell_type": "code",
"execution_count": 13,
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"2019 16323\n"
]
}
],
"source": [
"# For each year, print the num_of_students total of the rows selected by the\n",
"# c1 & c2 masks (as last defined by an earlier cell).\n",
"for y in df[\"year\"].unique():\n",
"    c3 = df[\"year\"].eq(y)\n",
"    print(y, df.loc[c1 & c2 & c3, \"num_of_students\"].sum())"
]
},
{
"cell_type": "code",
"execution_count": 14,
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>city</th>\n",
" <th>school_id</th>\n",
" <th>school_name</th>\n",
" <th>year</th>\n",
" <th>subject</th>\n",
" <th>credits</th>\n",
" <th>num_of_students</th>\n",
" <th>average</th>\n",
" <th>sum</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>9290</th>\n",
" <td>כאוכב אבו אל-היג'א</td>\n",
" <td>372243</td>\n",
" <td>מקיף כאוכב</td>\n",
" <td>2019</td>\n",
" <td>פיסיקה</td>\n",
" <td>5</td>\n",
" <td>15</td>\n",
" <td>94.47</td>\n",
" <td>1417.05</td>\n",
" </tr>\n",
" <tr>\n",
" <th>5562</th>\n",
" <td>כפר קאסם</td>\n",
" <td>448167</td>\n",
" <td>חט\"ב אבן סינא</td>\n",
" <td>2019</td>\n",
" <td>פיסיקה</td>\n",
" <td>5</td>\n",
" <td>36</td>\n",
" <td>94.08</td>\n",
" <td>3386.88</td>\n",
" </tr>\n",
" <tr>\n",
" <th>13225</th>\n",
" <td>ירושלים</td>\n",
" <td>140061</td>\n",
" <td>תכון ליד האוניברסיטה</td>\n",
" <td>2019</td>\n",
" <td>פיסיקה</td>\n",
" <td>5</td>\n",
" <td>29</td>\n",
" <td>93.90</td>\n",
" <td>2723.10</td>\n",
" </tr>\n",
" <tr>\n",
" <th>5964</th>\n",
" <td>קלנסווה</td>\n",
" <td>448076</td>\n",
" <td>תיכון מקיף קלנסווה</td>\n",
" <td>2019</td>\n",
" <td>פיסיקה</td>\n",
" <td>5</td>\n",
" <td>24</td>\n",
" <td>93.83</td>\n",
" <td>2251.92</td>\n",
" </tr>\n",
" <tr>\n",
" <th>8677</th>\n",
" <td>בענה</td>\n",
" <td>248260</td>\n",
" <td>מכללת אלביאן</td>\n",
" <td>2019</td>\n",
" <td>פיסיקה</td>\n",
" <td>5</td>\n",
" <td>11</td>\n",
" <td>93.45</td>\n",
" <td>1027.95</td>\n",
" </tr>\n",
" <tr>\n",
" <th>3703</th>\n",
" <td>נתניה</td>\n",
" <td>470187</td>\n",
" <td>תיכון תמר אריאל</td>\n",
" <td>2019</td>\n",
" <td>פיסיקה</td>\n",
" <td>5</td>\n",
" <td>12</td>\n",
" <td>93.33</td>\n",
" <td>1119.96</td>\n",
" </tr>\n",
" <tr>\n",
" <th>4878</th>\n",
" <td>גבעת שמואל</td>\n",
" <td>444620</td>\n",
" <td>אולפנה לבנות</td>\n",
" <td>2019</td>\n",
" <td>פיסיקה</td>\n",
" <td>5</td>\n",
" <td>28</td>\n",
" <td>93.32</td>\n",
" <td>2612.96</td>\n",
" </tr>\n",
" <tr>\n",
" <th>11709</th>\n",
" <td>יגור</td>\n",
" <td>360222</td>\n",
" <td>מקיף כרמל זבולון</td>\n",
" <td>2019</td>\n",
" <td>פיסיקה</td>\n",
" <td>5</td>\n",
" <td>18</td>\n",
" <td>93.00</td>\n",
" <td>1674.00</td>\n",
" </tr>\n",
" <tr>\n",
" <th>4456</th>\n",
" <td>תל אביב - יפו</td>\n",
" <td>540153</td>\n",
" <td>עירוני ה'</td>\n",
" <td>2019</td>\n",
" <td>פיסיקה</td>\n",
" <td>5</td>\n",
" <td>20</td>\n",
" <td>92.95</td>\n",
" <td>1859.00</td>\n",
" </tr>\n",
" <tr>\n",
" <th>14930</th>\n",
" <td>פתח תקווה</td>\n",
" <td>441204</td>\n",
" <td>ישיבת דרכי נעם</td>\n",
" <td>2019</td>\n",
" <td>פיסיקה</td>\n",
" <td>5</td>\n",
" <td>15</td>\n",
" <td>92.93</td>\n",
" <td>1393.95</td>\n",
" </tr>\n",
" <tr>\n",
" <th>4863</th>\n",
" <td>גבעת שמואל</td>\n",
" <td>441634</td>\n",
" <td>ישיבת בנ\"ע ג. שמואל</td>\n",
" <td>2019</td>\n",
" <td>פיסיקה</td>\n",
" <td>5</td>\n",
" <td>28</td>\n",
" <td>92.89</td>\n",
" <td>2600.92</td>\n",
" </tr>\n",
" <tr>\n",
" <th>5600</th>\n",
" <td>כפר קאסם</td>\n",
" <td>800086</td>\n",
" <td>מקיף כפר קאסם</td>\n",
" <td>2019</td>\n",
" <td>פיסיקה</td>\n",
" <td>5</td>\n",
" <td>33</td>\n",
" <td>92.67</td>\n",
" <td>3058.11</td>\n",
" </tr>\n",
" <tr>\n",
" <th>7674</th>\n",
" <td>חיפה</td>\n",
" <td>340216</td>\n",
" <td>הריאלי העברי חיפה</td>\n",
" <td>2019</td>\n",
" <td>פיסיקה</td>\n",
" <td>5</td>\n",
" <td>115</td>\n",
" <td>92.46</td>\n",
" <td>10632.90</td>\n",
" </tr>\n",
" <tr>\n",
" <th>4303</th>\n",
" <td>תל אביב - יפו</td>\n",
" <td>515502</td>\n",
" <td>תיכונ\"ט ע\"ש אלתרמן</td>\n",
" <td>2019</td>\n",
" <td>פיסיקה</td>\n",
" <td>5</td>\n",
" <td>50</td>\n",
" <td>92.32</td>\n",
" <td>4616.00</td>\n",
" </tr>\n",
" <tr>\n",
" <th>13568</th>\n",
" <td>ירושלים</td>\n",
" <td>144097</td>\n",
" <td>התיכון הישראלי למדעי</td>\n",
" <td>2019</td>\n",
" <td>פיסיקה</td>\n",
" <td>5</td>\n",
" <td>23</td>\n",
" <td>92.30</td>\n",
" <td>2122.90</td>\n",
" </tr>\n",
" <tr>\n",
" <th>602</th>\n",
" <td>מודיעין-מכבים-רעות</td>\n",
" <td>442780</td>\n",
" <td>אמי\"ת בנות מודיעין</td>\n",
" <td>2019</td>\n",
" <td>פיסיקה</td>\n",
" <td>5</td>\n",
" <td>12</td>\n",
" <td>92.25</td>\n",
" <td>1107.00</td>\n",
" </tr>\n",
" <tr>\n",
" <th>5500</th>\n",
" <td>כפר סבא</td>\n",
" <td>444117</td>\n",
" <td>תיכון ע\"ש חיים הרצוג</td>\n",
" <td>2019</td>\n",
" <td>פיסיקה</td>\n",
" <td>5</td>\n",
" <td>30</td>\n",
" <td>92.20</td>\n",
" <td>2766.00</td>\n",
" </tr>\n",
" <tr>\n",
" <th>10116</th>\n",
" <td>נצרת</td>\n",
" <td>247056</td>\n",
" <td>נזירות סנט גוזף</td>\n",
" <td>2019</td>\n",
" <td>פיסיקה</td>\n",
" <td>5</td>\n",
" <td>40</td>\n",
" <td>92.17</td>\n",
" <td>3686.80</td>\n",
" </tr>\n",
" <tr>\n",
" <th>5078</th>\n",
" <td>הוד השרון</td>\n",
" <td>441410</td>\n",
" <td>תיכון ע\"ש אילן רמון</td>\n",
" <td>2019</td>\n",
" <td>פיסיקה</td>\n",
" <td>5</td>\n",
" <td>45</td>\n",
" <td>92.13</td>\n",
" <td>4145.85</td>\n",
" </tr>\n",
" <tr>\n",
" <th>440</th>\n",
" <td>מודיעין-מכבים-רעות</td>\n",
" <td>144675</td>\n",
" <td>ע\"ש יצחק רבין עי\"ס</td>\n",
" <td>2019</td>\n",
" <td>פיסיקה</td>\n",
" <td>5</td>\n",
" <td>23</td>\n",
" <td>92.04</td>\n",
" <td>2116.92</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"</div>"
],
"text/plain": [
" city school_id school_name year subject \n",
"9290 כאוכב אבו אל-היג'א 372243 מקיף כאוכב 2019 פיסיקה \\\n",
"5562 כפר קאסם 448167 חט\"ב אבן סינא 2019 פיסיקה \n",
"13225 ירושלים 140061 תכון ליד האוניברסיטה 2019 פיסיקה \n",
"5964 קלנסווה 448076 תיכון מקיף קלנסווה 2019 פיסיקה \n",
"8677 בענה 248260 מכללת אלביאן 2019 פיסיקה \n",
"3703 נתניה 470187 תיכון תמר אריאל 2019 פיסיקה \n",
"4878 גבעת שמואל 444620 אולפנה לבנות 2019 פיסיקה \n",
"11709 יגור 360222 מקיף כרמל זבולון 2019 פיסיקה \n",
"4456 תל אביב - יפו 540153 עירוני ה' 2019 פיסיקה \n",
"14930 פתח תקווה 441204 ישיבת דרכי נעם 2019 פיסיקה \n",
"4863 גבעת שמואל 441634 ישיבת בנ\"ע ג. שמואל 2019 פיסיקה \n",
"5600 כפר קאסם 800086 מקיף כפר קאסם 2019 פיסיקה \n",
"7674 חיפה 340216 הריאלי העברי חיפה 2019 פיסיקה \n",
"4303 תל אביב - יפו 515502 תיכונ\"ט ע\"ש אלתרמן 2019 פיסיקה \n",
"13568 ירושלים 144097 התיכון הישראלי למדעי 2019 פיסיקה \n",
"602 מודיעין-מכבים-רעות 442780 אמי\"ת בנות מודיעין 2019 פיסיקה \n",
"5500 כפר סבא 444117 תיכון ע\"ש חיים הרצוג 2019 פיסיקה \n",
"10116 נצרת 247056 נזירות סנט גוזף 2019 פיסיקה \n",
"5078 הוד השרון 441410 תיכון ע\"ש אילן רמון 2019 פיסיקה \n",
"440 מודיעין-מכבים-רעות 144675 ע\"ש יצחק רבין עי\"ס 2019 פיסיקה \n",
"\n",
" credits num_of_students average sum \n",
"9290 5 15 94.47 1417.05 \n",
"5562 5 36 94.08 3386.88 \n",
"13225 5 29 93.90 2723.10 \n",
"5964 5 24 93.83 2251.92 \n",
"8677 5 11 93.45 1027.95 \n",
"3703 5 12 93.33 1119.96 \n",
"4878 5 28 93.32 2612.96 \n",
"11709 5 18 93.00 1674.00 \n",
"4456 5 20 92.95 1859.00 \n",
"14930 5 15 92.93 1393.95 \n",
"4863 5 28 92.89 2600.92 \n",
"5600 5 33 92.67 3058.11 \n",
"7674 5 115 92.46 10632.90 \n",
"4303 5 50 92.32 4616.00 \n",
"13568 5 23 92.30 2122.90 \n",
"602 5 12 92.25 1107.00 \n",
"5500 5 30 92.20 2766.00 \n",
"10116 5 40 92.17 3686.80 \n",
"5078 5 45 92.13 4145.85 \n",
"440 5 23 92.04 2116.92 "
]
},
"execution_count": 14,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"# The 20 rows with the highest `average` among 5-credit physics entries.\n",
"# Only c1 is rebuilt here; c2 (credits == 5) is reused from the earlier mathematics cell.\n",
"c1 = df[\"subject\"].eq(\"פיסיקה\")\n",
"df.loc[c1 & c2].nlargest(n=20, columns=\"average\")"
]
},
{
"cell_type": "code",
"execution_count": 15,
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"2019 11344\n"
]
}
],
"source": [
"# For each year, print the num_of_students total of the rows selected by the\n",
"# c1 & c2 masks (c1 was rebound to physics in the previous cell).\n",
"for y in df[\"year\"].unique():\n",
"    c3 = df[\"year\"].eq(y)\n",
"    print(y, df.loc[c1 & c2 & c3, \"num_of_students\"].sum())"
]
},
{
"cell_type": "code",
"execution_count": 16,
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>city</th>\n",
" <th>school_id</th>\n",
" <th>school_name</th>\n",
" <th>year</th>\n",
" <th>subject</th>\n",
" <th>credits</th>\n",
" <th>num_of_students</th>\n",
" <th>average</th>\n",
" <th>sum</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>7274</th>\n",
" <td>ג'ת</td>\n",
" <td>348185</td>\n",
" <td>ביה\"ס גת המשולש</td>\n",
" <td>2019</td>\n",
" <td>מערכות אלקטרוניות</td>\n",
" <td>5</td>\n",
" <td>36</td>\n",
" <td>100.0</td>\n",
" <td>3600.0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>6899</th>\n",
" <td>תל מונד</td>\n",
" <td>441279</td>\n",
" <td>בית חינוך ע\"ש רבין</td>\n",
" <td>2019</td>\n",
" <td>טכנולוגיה מוכללת</td>\n",
" <td>5</td>\n",
" <td>33</td>\n",
" <td>100.0</td>\n",
" <td>3300.0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>7173</th>\n",
" <td>באקה אל-גרביה</td>\n",
" <td>348342</td>\n",
" <td>עי\"ס אלקאסמי</td>\n",
" <td>2019</td>\n",
" <td>מערכות אלקטרוניות</td>\n",
" <td>5</td>\n",
" <td>31</td>\n",
" <td>100.0</td>\n",
" <td>3100.0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>10324</th>\n",
" <td>סח'נין</td>\n",
" <td>248278</td>\n",
" <td>בית ספר אלבשאאר</td>\n",
" <td>2019</td>\n",
" <td>תכנון ותכנות מערכות</td>\n",
" <td>5</td>\n",
" <td>27</td>\n",
" <td>100.0</td>\n",
" <td>2700.0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>10117</th>\n",
" <td>נצרת</td>\n",
" <td>247056</td>\n",
" <td>נזירות סנט גוזף</td>\n",
" <td>2019</td>\n",
" <td>תכנון ותכנות מערכות</td>\n",
" <td>5</td>\n",
" <td>25</td>\n",
" <td>100.0</td>\n",
" <td>2500.0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>13015</th>\n",
" <td>רמת השרון</td>\n",
" <td>580019</td>\n",
" <td>חקלאי הכפר הירוק</td>\n",
" <td>2019</td>\n",
" <td>מערכות אלקטרוניות</td>\n",
" <td>5</td>\n",
" <td>17</td>\n",
" <td>100.0</td>\n",
" <td>1700.0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>4084</th>\n",
" <td>רמת גן</td>\n",
" <td>540211</td>\n",
" <td>עירוני ע\"ש בליך</td>\n",
" <td>2019</td>\n",
" <td>מחול</td>\n",
" <td>5</td>\n",
" <td>11</td>\n",
" <td>100.0</td>\n",
" <td>1100.0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>6779</th>\n",
" <td>רעננה</td>\n",
" <td>441808</td>\n",
" <td>תיכון אביב</td>\n",
" <td>2019</td>\n",
" <td>תכנון ותכנות מערכות</td>\n",
" <td>5</td>\n",
" <td>11</td>\n",
" <td>100.0</td>\n",
" <td>1100.0</td>\n",
" </tr>\n",
" <tr>\n",
" <th>14326</th>\n",
" <td>ביתר עילית</td>\n",
" <td>722066</td>\n",
" <td>סמינר מורשת ירושלים</td>\n",
" <td>2019</td>\n",
" <td>רישומי פעילויות בחינ</td>\n",
" <td>3</td>\n",
" <td>11</td>\n",
" <td>100.0</td>\n",
" <td>1100.0</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"</div>"
],
"text/plain": [
" city school_id school_name year \n",
"7274 ג'ת 348185 ביה\"ס גת המשולש 2019 \\\n",
"6899 תל מונד 441279 בית חינוך ע\"ש רבין 2019 \n",
"7173 באקה אל-גרביה 348342 עי\"ס אלקאסמי 2019 \n",
"10324 סח'נין 248278 בית ספר אלבשאאר 2019 \n",
"10117 נצרת 247056 נזירות סנט גוזף 2019 \n",
"13015 רמת השרון 580019 חקלאי הכפר הירוק 2019 \n",
"4084 רמת גן 540211 עירוני ע\"ש בליך 2019 \n",
"6779 רעננה 441808 תיכון אביב 2019 \n",
"14326 ביתר עילית 722066 סמינר מורשת ירושלים 2019 \n",
"\n",
" subject credits num_of_students average sum \n",
"7274 מערכות אלקטרוניות 5 36 100.0 3600.0 \n",
"6899 טכנולוגיה מוכללת 5 33 100.0 3300.0 \n",
"7173 מערכות אלקטרוניות 5 31 100.0 3100.0 \n",
"10324 תכנון ותכנות מערכות 5 27 100.0 2700.0 \n",
"10117 תכנון ותכנות מערכות 5 25 100.0 2500.0 \n",
"13015 מערכות אלקטרוניות 5 17 100.0 1700.0 \n",
"4084 מחול 5 11 100.0 1100.0 \n",
"6779 תכנון ותכנות מערכות 5 11 100.0 1100.0 \n",
"14326 רישומי פעילויות בחינ 3 11 100.0 1100.0 "
]
},
"execution_count": 16,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"df[df[\"average\"] == 100].sort_values(by=[\"num_of_students\"], ascending=False)"
]
},
{
"cell_type": "code",
"execution_count": 17,
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"city 77\n",
"school_id 77\n",
"school_name 77\n",
"year 77\n",
"subject 77\n",
"credits 77\n",
"num_of_students 77\n",
"average 77\n",
"sum 77\n",
"dtype: int64"
]
},
"execution_count": 17,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"df[df[\"average\"] < 56].count()"
]
},
{
"cell_type": "code",
"execution_count": 18,
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>subject</th>\n",
" <th>credits</th>\n",
" <th>num_of_students</th>\n",
" <th>average</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>122</th>\n",
" <td>מערכות תעופה</td>\n",
" <td>3</td>\n",
" <td>28</td>\n",
" <td>60.820000</td>\n",
" </tr>\n",
" <tr>\n",
" <th>140</th>\n",
" <td>עברית לבי\"ס דרוזי</td>\n",
" <td>3</td>\n",
" <td>1213</td>\n",
" <td>61.006892</td>\n",
" </tr>\n",
" <tr>\n",
" <th>84</th>\n",
" <td>מערכות מכונאות רכב</td>\n",
" <td>3</td>\n",
" <td>161</td>\n",
" <td>63.757826</td>\n",
" </tr>\n",
" <tr>\n",
" <th>110</th>\n",
" <td>מערכות רכב</td>\n",
" <td>3</td>\n",
" <td>43</td>\n",
" <td>64.580930</td>\n",
" </tr>\n",
" <tr>\n",
" <th>118</th>\n",
" <td>מדעי התזונה</td>\n",
" <td>5</td>\n",
" <td>83</td>\n",
" <td>66.506024</td>\n",
" </tr>\n",
" <tr>\n",
" <th>...</th>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" </tr>\n",
" <tr>\n",
" <th>104</th>\n",
" <td>מחשבים ומערכות</td>\n",
" <td>5</td>\n",
" <td>143</td>\n",
" <td>93.888531</td>\n",
" </tr>\n",
" <tr>\n",
" <th>149</th>\n",
" <td>מחשוב ובקרה</td>\n",
" <td>5</td>\n",
" <td>62</td>\n",
" <td>93.934839</td>\n",
" </tr>\n",
" <tr>\n",
" <th>61</th>\n",
" <td>תכנון ותכנות מערכות</td>\n",
" <td>5</td>\n",
" <td>4413</td>\n",
" <td>94.551634</td>\n",
" </tr>\n",
" <tr>\n",
" <th>74</th>\n",
" <td>מחול</td>\n",
" <td>5</td>\n",
" <td>311</td>\n",
" <td>95.716720</td>\n",
" </tr>\n",
" <tr>\n",
" <th>148</th>\n",
" <td>איטלקית</td>\n",
" <td>5</td>\n",
" <td>14</td>\n",
" <td>99.290000</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"<p>151 rows × 4 columns</p>\n",
"</div>"
],
"text/plain": [
" subject credits num_of_students average\n",
"122 מערכות תעופה 3 28 60.820000\n",
"140 עברית לבי\"ס דרוזי 3 1213 61.006892\n",
"84 מערכות מכונאות רכב 3 161 63.757826\n",
"110 מערכות רכב 3 43 64.580930\n",
"118 מדעי התזונה 5 83 66.506024\n",
".. ... ... ... ...\n",
"104 מחשבים ומערכות 5 143 93.888531\n",
"149 מחשוב ובקרה 5 62 93.934839\n",
"61 תכנון ותכנות מערכות 5 4413 94.551634\n",
"74 מחול 5 311 95.716720\n",
"148 איטלקית 5 14 99.290000\n",
"\n",
"[151 rows x 4 columns]"
]
},
"execution_count": 18,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"df_dict = {\"subject\": [], \"credits\": [], \"num_of_students\": [], \"average\": []}\n",
"for sub in df.subject.unique():\n",
" c1 = df[\"subject\"] == sub\n",
" for cr in sorted(df.loc[c1, \"credits\"].unique()):\n",
" c2 = df[\"credits\"] == cr\n",
" tot = float(df.loc[c1 & c2, \"sum\"].sum())\n",
" st = int(df.loc[c1 & c2, \"num_of_students\"].sum())\n",
"\n",
" df_dict[\"subject\"].append(sub)\n",
" df_dict[\"credits\"].append(cr)\n",
" df_dict[\"num_of_students\"].append(st)\n",
" df_dict[\"average\"].append(tot / st)\n",
"\n",
"df_subjects = pd.DataFrame(df_dict)\n",
"df_subjects = df_subjects[df_subjects[\"average\"] > 0].sort_values(by=[\"average\"])\n",
"df_subjects[\"num_of_students\"] = df_subjects[\"num_of_students\"].astype(int)\n",
"df_subjects"
]
},
{
"cell_type": "code",
"execution_count": 19,
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>subject</th>\n",
" <th>credits</th>\n",
" <th>num_of_students</th>\n",
" <th>average</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>0</th>\n",
" <td>אזרחות</td>\n",
" <td>2</td>\n",
" <td>90225</td>\n",
" <td>74.539032</td>\n",
" </tr>\n",
" <tr>\n",
" <th>21</th>\n",
" <td>הבעה עברית</td>\n",
" <td>2</td>\n",
" <td>68930</td>\n",
" <td>75.284605</td>\n",
" </tr>\n",
" <tr>\n",
" <th>22</th>\n",
" <td>הסטוריה</td>\n",
" <td>2</td>\n",
" <td>68014</td>\n",
" <td>77.931136</td>\n",
" </tr>\n",
" <tr>\n",
" <th>36</th>\n",
" <td>ספרות</td>\n",
" <td>2</td>\n",
" <td>53268</td>\n",
" <td>77.328742</td>\n",
" </tr>\n",
" <tr>\n",
" <th>27</th>\n",
" <td>תנ'ך</td>\n",
" <td>2</td>\n",
" <td>50240</td>\n",
" <td>78.425645</td>\n",
" </tr>\n",
" <tr>\n",
" <th>14</th>\n",
" <td>מתמטיקה</td>\n",
" <td>3</td>\n",
" <td>47043</td>\n",
" <td>77.158361</td>\n",
" </tr>\n",
" <tr>\n",
" <th>4</th>\n",
" <td>אנגלית</td>\n",
" <td>5</td>\n",
" <td>45869</td>\n",
" <td>87.609294</td>\n",
" </tr>\n",
" <tr>\n",
" <th>3</th>\n",
" <td>אנגלית</td>\n",
" <td>4</td>\n",
" <td>28004</td>\n",
" <td>77.512400</td>\n",
" </tr>\n",
" <tr>\n",
" <th>7</th>\n",
" <td>הסטוריה לבי'ס ערבי</td>\n",
" <td>2</td>\n",
" <td>20411</td>\n",
" <td>84.703571</td>\n",
" </tr>\n",
" <tr>\n",
" <th>15</th>\n",
" <td>מתמטיקה</td>\n",
" <td>4</td>\n",
" <td>20308</td>\n",
" <td>81.188945</td>\n",
" </tr>\n",
" <tr>\n",
" <th>19</th>\n",
" <td>ערבית לערבים</td>\n",
" <td>3</td>\n",
" <td>18046</td>\n",
" <td>74.953832</td>\n",
" </tr>\n",
" <tr>\n",
" <th>6</th>\n",
" <td>ביולוגיה</td>\n",
" <td>5</td>\n",
" <td>17443</td>\n",
" <td>79.553223</td>\n",
" </tr>\n",
" <tr>\n",
" <th>16</th>\n",
" <td>מתמטיקה</td>\n",
" <td>5</td>\n",
" <td>16323</td>\n",
" <td>81.697470</td>\n",
" </tr>\n",
" <tr>\n",
" <th>17</th>\n",
" <td>עברית לבי'ס ערבי</td>\n",
" <td>3</td>\n",
" <td>15124</td>\n",
" <td>69.769589</td>\n",
" </tr>\n",
" <tr>\n",
" <th>2</th>\n",
" <td>אנגלית</td>\n",
" <td>3</td>\n",
" <td>14650</td>\n",
" <td>73.856224</td>\n",
" </tr>\n",
" <tr>\n",
" <th>52</th>\n",
" <td>פיסיקה</td>\n",
" <td>5</td>\n",
" <td>11344</td>\n",
" <td>85.682271</td>\n",
" </tr>\n",
" <tr>\n",
" <th>24</th>\n",
" <td>מחשבת ישראל וספרות</td>\n",
" <td>2</td>\n",
" <td>11278</td>\n",
" <td>81.830137</td>\n",
" </tr>\n",
" <tr>\n",
" <th>29</th>\n",
" <td>תנ'ך</td>\n",
" <td>5</td>\n",
" <td>9810</td>\n",
" <td>83.693271</td>\n",
" </tr>\n",
" <tr>\n",
" <th>10</th>\n",
" <td>כימיה</td>\n",
" <td>5</td>\n",
" <td>9634</td>\n",
" <td>81.825381</td>\n",
" </tr>\n",
" <tr>\n",
" <th>26</th>\n",
" <td>תושבע'פ ותלמוד</td>\n",
" <td>5</td>\n",
" <td>9579</td>\n",
" <td>81.523992</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"</div>"
],
"text/plain": [
" subject credits num_of_students average\n",
"0 אזרחות 2 90225 74.539032\n",
"21 הבעה עברית 2 68930 75.284605\n",
"22 הסטוריה 2 68014 77.931136\n",
"36 ספרות 2 53268 77.328742\n",
"27 תנ'ך 2 50240 78.425645\n",
"14 מתמטיקה 3 47043 77.158361\n",
"4 אנגלית 5 45869 87.609294\n",
"3 אנגלית 4 28004 77.512400\n",
"7 הסטוריה לבי'ס ערבי 2 20411 84.703571\n",
"15 מתמטיקה 4 20308 81.188945\n",
"19 ערבית לערבים 3 18046 74.953832\n",
"6 ביולוגיה 5 17443 79.553223\n",
"16 מתמטיקה 5 16323 81.697470\n",
"17 עברית לבי'ס ערבי 3 15124 69.769589\n",
"2 אנגלית 3 14650 73.856224\n",
"52 פיסיקה 5 11344 85.682271\n",
"24 מחשבת ישראל וספרות 2 11278 81.830137\n",
"29 תנ'ך 5 9810 83.693271\n",
"10 כימיה 5 9634 81.825381\n",
"26 תושבע'פ ותלמוד 5 9579 81.523992"
]
},
"execution_count": 19,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"df_subjects.nlargest(20, \"num_of_students\")"
]
},
{
"cell_type": "code",
"execution_count": 20,
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>subject</th>\n",
" <th>credits</th>\n",
" <th>num_of_students</th>\n",
" <th>average</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>2</th>\n",
" <td>אנגלית</td>\n",
" <td>3</td>\n",
" <td>14650</td>\n",
" <td>73.856224</td>\n",
" </tr>\n",
" <tr>\n",
" <th>0</th>\n",
" <td>אזרחות</td>\n",
" <td>2</td>\n",
" <td>90225</td>\n",
" <td>74.539032</td>\n",
" </tr>\n",
" <tr>\n",
" <th>45</th>\n",
" <td>גאוגרפיה</td>\n",
" <td>5</td>\n",
" <td>5606</td>\n",
" <td>75.351561</td>\n",
" </tr>\n",
" <tr>\n",
" <th>14</th>\n",
" <td>מתמטיקה</td>\n",
" <td>3</td>\n",
" <td>47043</td>\n",
" <td>77.158361</td>\n",
" </tr>\n",
" <tr>\n",
" <th>3</th>\n",
" <td>אנגלית</td>\n",
" <td>4</td>\n",
" <td>28004</td>\n",
" <td>77.512400</td>\n",
" </tr>\n",
" <tr>\n",
" <th>22</th>\n",
" <td>הסטוריה</td>\n",
" <td>2</td>\n",
" <td>68014</td>\n",
" <td>77.931136</td>\n",
" </tr>\n",
" <tr>\n",
" <th>27</th>\n",
" <td>תנ'ך</td>\n",
" <td>2</td>\n",
" <td>50240</td>\n",
" <td>78.425645</td>\n",
" </tr>\n",
" <tr>\n",
" <th>6</th>\n",
" <td>ביולוגיה</td>\n",
" <td>5</td>\n",
" <td>17443</td>\n",
" <td>79.553223</td>\n",
" </tr>\n",
" <tr>\n",
" <th>9</th>\n",
" <td>כימיה</td>\n",
" <td>3</td>\n",
" <td>26</td>\n",
" <td>79.620000</td>\n",
" </tr>\n",
" <tr>\n",
" <th>28</th>\n",
" <td>תנ'ך</td>\n",
" <td>3</td>\n",
" <td>7526</td>\n",
" <td>79.867222</td>\n",
" </tr>\n",
" <tr>\n",
" <th>33</th>\n",
" <td>חקלאות</td>\n",
" <td>5</td>\n",
" <td>1932</td>\n",
" <td>81.096599</td>\n",
" </tr>\n",
" <tr>\n",
" <th>15</th>\n",
" <td>מתמטיקה</td>\n",
" <td>4</td>\n",
" <td>20308</td>\n",
" <td>81.188945</td>\n",
" </tr>\n",
" <tr>\n",
" <th>16</th>\n",
" <td>מתמטיקה</td>\n",
" <td>5</td>\n",
" <td>16323</td>\n",
" <td>81.697470</td>\n",
" </tr>\n",
" <tr>\n",
" <th>10</th>\n",
" <td>כימיה</td>\n",
" <td>5</td>\n",
" <td>9634</td>\n",
" <td>81.825381</td>\n",
" </tr>\n",
" <tr>\n",
" <th>5</th>\n",
" <td>ביולוגיה</td>\n",
" <td>3</td>\n",
" <td>13</td>\n",
" <td>83.000000</td>\n",
" </tr>\n",
" <tr>\n",
" <th>29</th>\n",
" <td>תנ'ך</td>\n",
" <td>5</td>\n",
" <td>9810</td>\n",
" <td>83.693271</td>\n",
" </tr>\n",
" <tr>\n",
" <th>1</th>\n",
" <td>אזרחות</td>\n",
" <td>5</td>\n",
" <td>368</td>\n",
" <td>84.531223</td>\n",
" </tr>\n",
" <tr>\n",
" <th>23</th>\n",
" <td>הסטוריה</td>\n",
" <td>5</td>\n",
" <td>570</td>\n",
" <td>84.853035</td>\n",
" </tr>\n",
" <tr>\n",
" <th>52</th>\n",
" <td>פיסיקה</td>\n",
" <td>5</td>\n",
" <td>11344</td>\n",
" <td>85.682271</td>\n",
" </tr>\n",
" <tr>\n",
" <th>46</th>\n",
" <td>מדעי המחשב</td>\n",
" <td>5</td>\n",
" <td>7838</td>\n",
" <td>86.369865</td>\n",
" </tr>\n",
" <tr>\n",
" <th>60</th>\n",
" <td>אומנות</td>\n",
" <td>5</td>\n",
" <td>642</td>\n",
" <td>86.867508</td>\n",
" </tr>\n",
" <tr>\n",
" <th>4</th>\n",
" <td>אנגלית</td>\n",
" <td>5</td>\n",
" <td>45869</td>\n",
" <td>87.609294</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"</div>"
],
"text/plain": [
" subject credits num_of_students average\n",
"2 אנגלית 3 14650 73.856224\n",
"0 אזרחות 2 90225 74.539032\n",
"45 גאוגרפיה 5 5606 75.351561\n",
"14 מתמטיקה 3 47043 77.158361\n",
"3 אנגלית 4 28004 77.512400\n",
"22 הסטוריה 2 68014 77.931136\n",
"27 תנ'ך 2 50240 78.425645\n",
"6 ביולוגיה 5 17443 79.553223\n",
"9 כימיה 3 26 79.620000\n",
"28 תנ'ך 3 7526 79.867222\n",
"33 חקלאות 5 1932 81.096599\n",
"15 מתמטיקה 4 20308 81.188945\n",
"16 מתמטיקה 5 16323 81.697470\n",
"10 כימיה 5 9634 81.825381\n",
"5 ביולוגיה 3 13 83.000000\n",
"29 תנ'ך 5 9810 83.693271\n",
"1 אזרחות 5 368 84.531223\n",
"23 הסטוריה 5 570 84.853035\n",
"52 פיסיקה 5 11344 85.682271\n",
"46 מדעי המחשב 5 7838 86.369865\n",
"60 אומנות 5 642 86.867508\n",
"4 אנגלית 5 45869 87.609294"
]
},
"execution_count": 20,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"df_subjects[df_subjects[\"subject\"].isin(int_subjects)]"
]
},
{
"cell_type": "code",
"execution_count": 21,
"metadata": {},
"outputs": [
{
"data": {
"text/html": [
"<div>\n",
"<style scoped>\n",
" .dataframe tbody tr th:only-of-type {\n",
" vertical-align: middle;\n",
" }\n",
"\n",
" .dataframe tbody tr th {\n",
" vertical-align: top;\n",
" }\n",
"\n",
" .dataframe thead th {\n",
" text-align: right;\n",
" }\n",
"</style>\n",
"<table border=\"1\" class=\"dataframe\">\n",
" <thead>\n",
" <tr style=\"text-align: right;\">\n",
" <th></th>\n",
" <th>subject</th>\n",
" <th>credits</th>\n",
" <th>num_of_students</th>\n",
" <th>average</th>\n",
" </tr>\n",
" </thead>\n",
" <tbody>\n",
" <tr>\n",
" <th>118</th>\n",
" <td>מדעי התזונה</td>\n",
" <td>5</td>\n",
" <td>83</td>\n",
" <td>66.506024</td>\n",
" </tr>\n",
" <tr>\n",
" <th>85</th>\n",
" <td>מערכות מכונאות רכב</td>\n",
" <td>5</td>\n",
" <td>69</td>\n",
" <td>69.854783</td>\n",
" </tr>\n",
" <tr>\n",
" <th>54</th>\n",
" <td>תיירות</td>\n",
" <td>5</td>\n",
" <td>608</td>\n",
" <td>69.924720</td>\n",
" </tr>\n",
" <tr>\n",
" <th>82</th>\n",
" <td>מערכות חשמל</td>\n",
" <td>5</td>\n",
" <td>932</td>\n",
" <td>70.149989</td>\n",
" </tr>\n",
" <tr>\n",
" <th>117</th>\n",
" <td>אומניות הבשול המלונא</td>\n",
" <td>5</td>\n",
" <td>82</td>\n",
" <td>72.572805</td>\n",
" </tr>\n",
" <tr>\n",
" <th>...</th>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" <td>...</td>\n",
" </tr>\n",
" <tr>\n",
" <th>104</th>\n",
" <td>מחשבים ומערכות</td>\n",
" <td>5</td>\n",
" <td>143</td>\n",
" <td>93.888531</td>\n",
" </tr>\n",
" <tr>\n",
" <th>149</th>\n",
" <td>מחשוב ובקרה</td>\n",
" <td>5</td>\n",
" <td>62</td>\n",
" <td>93.934839</td>\n",
" </tr>\n",
" <tr>\n",
" <th>61</th>\n",
" <td>תכנון ותכנות מערכות</td>\n",
" <td>5</td>\n",
" <td>4413</td>\n",
" <td>94.551634</td>\n",
" </tr>\n",
" <tr>\n",
" <th>74</th>\n",
" <td>מחול</td>\n",
" <td>5</td>\n",
" <td>311</td>\n",
" <td>95.716720</td>\n",
" </tr>\n",
" <tr>\n",
" <th>148</th>\n",
" <td>איטלקית</td>\n",
" <td>5</td>\n",
" <td>14</td>\n",
" <td>99.290000</td>\n",
" </tr>\n",
" </tbody>\n",
"</table>\n",
"<p>103 rows × 4 columns</p>\n",
"</div>"
],
"text/plain": [
" subject credits num_of_students average\n",
"118 מדעי התזונה 5 83 66.506024\n",
"85 מערכות מכונאות רכב 5 69 69.854783\n",
"54 תיירות 5 608 69.924720\n",
"82 מערכות חשמל 5 932 70.149989\n",
"117 אומניות הבשול המלונא 5 82 72.572805\n",
".. ... ... ... ...\n",
"104 מחשבים ומערכות 5 143 93.888531\n",
"149 מחשוב ובקרה 5 62 93.934839\n",
"61 תכנון ותכנות מערכות 5 4413 94.551634\n",
"74 מחול 5 311 95.716720\n",
"148 איטלקית 5 14 99.290000\n",
"\n",
"[103 rows x 4 columns]"
]
},
"execution_count": 21,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"df_subjects[df_subjects[\"credits\"] == 5]"
]
},
{
"cell_type": "code",
"execution_count": 22,
"metadata": {},
"outputs": [
{
"data": {
"image/png": "\n",
"text/plain": [
"<Figure size 640x480 with 1 Axes>"
]
},
"metadata": {},
"output_type": "display_data"
}
],
"source": [
"df[\"average\"].plot.hist(bins=int(df[\"average\"].max() - df[\"average\"].min()))\n",
"plt.grid()\n",
"plt.show()"
]
},
{
"cell_type": "code",
"execution_count": 23,
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"79.83"
]
},
"execution_count": 23,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"df[\"average\"].median()"
]
},
{
"cell_type": "code",
"execution_count": 24,
"metadata": {},
"outputs": [
{
"data": {
"image/png": "\n",
"text/plain": [
"<Figure size 640x480 with 1 Axes>"
]
},
"metadata": {},
"output_type": "display_data"
}
],
"source": [
"df[\"num_of_students\"].plot.hist(bins=150)\n",
"plt.grid()\n",
"plt.show()"
]
},
{
"cell_type": "code",
"execution_count": 25,
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"28.0"
]
},
"execution_count": 25,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"df[\"num_of_students\"].median()"
]
},
{
"cell_type": "code",
"execution_count": 26,
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"498"
]
},
"execution_count": 26,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"df[\"num_of_students\"].max()"
]
},
{
"cell_type": "code",
"execution_count": 27,
"metadata": {},
"outputs": [
{
"data": {
"image/png": "\n",
"text/plain": [
"<Figure size 640x480 with 1 Axes>"
]
},
"metadata": {},
"output_type": "display_data"
}
],
"source": [
"df_subjects[\"average\"].plot.hist(\n",
" bins=int(df_subjects[\"average\"].max() - df_subjects[\"average\"].min())\n",
")\n",
"plt.grid()\n",
"plt.show()"
]
},
{
"cell_type": "code",
"execution_count": null,
"metadata": {},
"outputs": [],
"source": []
}
],
"metadata": {
"kernelspec": {
"display_name": "Python 3 (ipykernel)",
"language": "python",
"name": "python3"
},
"language_info": {
"codemirror_mode": {
"name": "ipython",
"version": 3
},
"file_extension": ".py",
"mimetype": "text/x-python",
"name": "python",
"nbconvert_exporter": "python",
"pygments_lexer": "ipython3",
"version": "3.11.5"
}
},
"nbformat": 4,
"nbformat_minor": 2
}
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment