51215903065
/
DaseTalentDocs


								{

								 "cells": [

								  {

								   "cell_type": "code",

								   "execution_count": 1,

								   "id": "b59dad38",

								   "metadata": {},

								   "outputs": [],

								   "source": [

								    "import pandas as pd\n",

								    "\n",

								    "\n",

								    "class FileTypeError(TypeError):\n",

								    "    pass\n",

								    "\n",

								    "\n",

								    "class ContestScore:\n",

								    "    # define a global `null` so that eval(cur_info) in gen_max_cases_ can resolve the name `null`\n",

								    "    global null\n",

								    "    null = ''\n",

								    "\n",

								    "    def __init__(self, ):\n",

								    "        self.rank_path = ''\n",

								    "        self.submission_path = ''\n",

								    "        self.problem_path = ''\n",

								    "        self.ranks_df = None\n",

								    "        self.submission_df = None\n",

								    "        self.problem_df = None\n",

								    "        self.problem_names = []\n",

								    "        self.problem_ids = []\n",

								    "        self.contest_score = None\n",

								    "\n",

								    "        # state used when calculating max cases\n",

								    "        self.target_problem = 0\n",

								    "        self.gen_all_cases = True\n",

								    "\n",

								    "    def load_data(self, rank_path, submission_path, problem_path):\n",

								    "        # load data\n",

								    "        self.ranks_df = ContestScore.read_dataframe(rank_path)\n",

								    "        self.submission_df = ContestScore.read_dataframe(submission_path)\n",

								    "        self.rank_path = rank_path\n",

								    "        self.submission_path = submission_path\n",

								    "        rank_columns = self.ranks_df.columns.tolist()\n",

								    "        self.problem_names = rank_columns[6:]\n",

								    "\n",

								    "        # process ranks\n",

								    "        drop_data = ['User ID', 'Real Name', 'Total Submission'] + self.problem_names\n",

								    "        self.contest_score = self.ranks_df.drop(axis=1, columns=drop_data)\n",

								    "\n",

								    "        # calculate max cases\n",

								    "        self.contest_score['通过用例数'] = self.contest_score.apply(self.gen_max_cases, axis=1)\n",

								    "\n",

								    "        # get problem_names and problem_ids\n",

								    "        # calculate problem cases\n",

								    "        if problem_path:\n",

								    "            self.get_problems(problem_path)\n",

								    "            self.calculate()\n",

								    "        else:\n",

								    "            print(\"Please Set Problem names and ids by set_problems(names, ids) function\")\n",

								    "\n",

								    "        # sort scores\n",

								    "        self.sort()\n",

								    "\n",

								    "    def get_problems(self, problem_path):\n",

								    "        self.problem_df = ContestScore.read_dataframe(problem_path)\n",

								    "        self.problem_names = self.problem_df.title.to_list()\n",

								    "        self.problem_ids = self.problem_df.id.to_list()\n",

								    "        self.problem_path = problem_path\n",

								    "\n",

								    "    def gen_max_cases(self, df):\n",

								    "        self.gen_all_cases = True\n",

								    "        return self.gen_max_cases_(df)\n",

								    "\n",

								    "    def set_problems(self, problem_names, problem_ids):\n",

								    "        self.problem_names = problem_names\n",

								    "        self.problem_ids = problem_ids\n",

								    "\n",

								    "    def calculate(self):\n",

								    "        # calculate max cases for certain problems\n",

								    "        self.gen_all_cases = False\n",

								    "        for index, p_id in enumerate(self.problem_ids):\n",

								    "            self.target_problem = p_id\n",

								    "            p_name = self.problem_names[index]\n",

								    "            self.contest_score[p_name] = self.contest_score.apply(self.gen_max_cases_problem, axis=1)\n",

								    "\n",

								    "    def gen_max_cases_problem(self, df):\n",

								    "        self.gen_all_cases = False\n",

								    "        return self.gen_max_cases_(df)\n",

								    "\n",

								    "    def gen_max_cases_(self, df):\n",

								    "        cur_max_cases = {}\n",

								    "        for i in range(len(self.submission_df)):\n",

								    "            if str(self.submission_df.iloc[i]['username']) == str(df['Username']) \\\n",

								    "                    and (self.gen_all_cases or self.target_problem == self.submission_df.iloc[i]['problem_id']):\n",

								    "                try:\n",

								    "                    cur_info = self.submission_df.iloc[i]['info']\n",

								    "                    cur_problem_id = self.submission_df.iloc[i]['problem_id']\n",

								    "                    cur_score = sum(list(map(lambda x: x['result'] == 0, eval(cur_info)['data'])))\n",

								    "\n",

								    "                    if not (cur_problem_id in cur_max_cases.keys()):\n",

								    "                        cur_max_cases[cur_problem_id] = cur_score\n",

								    "                    elif cur_score > cur_max_cases[cur_problem_id]:\n",

								    "                        cur_max_cases[cur_problem_id] = cur_score\n",

								    "                except:\n",

								    "                    continue\n",

								    "        return sum(cur_max_cases.values())\n",

								    "\n",

								    "    def sort(self, by=['AC', '通过用例数', 'Total Time'], ascending=[False, False, True]):\n",

								    "        self.contest_score = self.contest_score.sort_values(by=by, ascending=ascending)\n",

								    "        return self.contest_score\n",

								    "\n",

								    "    def save(self, path):\n",

								    "        self.contest_score.to_excel(path, index=False)\n",

								    "        return f\"File Saved at {path} as Excel\"\n",

								    "\n",

								    "    @staticmethod\n",

								    "    def read_dataframe(path):\n",

								    "        filetype = path.split('.')[-1]\n",

								    "        dataframe = None\n",

								    "        if filetype == 'csv':\n",

								    "            dataframe = pd.read_csv(path)\n",

								    "        elif filetype == 'xlsx':\n",

								    "            dataframe = pd.read_excel(path)\n",

								    "        else:\n",

								    "            FileTypeError(filetype)\n",

								    "        return dataframe"

								   ]

								  },

								  {

								   "cell_type": "code",

								   "execution_count": 2,

								   "id": "09049d66",

								   "metadata": {},

								   "outputs": [],

								   "source": [

								    "test = ContestScore()"

								   ]

								  },

								  {

								   "cell_type": "code",

								   "execution_count": 3,

								   "id": "73373376",

								   "metadata": {},

								   "outputs": [

								    {

								     "name": "stdout",

								     "output_type": "stream",

								     "text": [

								      "\u001b[0m\u001b[38;5;167m机试成绩导出.ipynb\u001b[0m    \u001b[38;5;78mproblem_202207021234.csv\u001b[0m\r\n",

								      "\u001b[38;5;33;1mcontent-68-rank.xlsx\u001b[0m  \u001b[38;5;78msubmission_202207021235.csv\u001b[0m\r\n"

								     ]

								    }

								   ],

								   "source": [

								    "%ls"

								   ]

								  },

								  {

								   "cell_type": "code",

								   "execution_count": 4,

								   "id": "2b0cedc1",

								   "metadata": {

								    "scrolled": true

								   },

								   "outputs": [

								    {

								     "data": {

								      "text/plain": [

								       "'File Saved at Result.xlsx as Excel'"

								      ]

								     },

								     "execution_count": 4,

								     "metadata": {},

								     "output_type": "execute_result"

								    }

								   ],

								   "source": [

								    "# load data and calculate scores and ranks automatically\n",

								    "test.load_data(rank_path='./content-68-rank.xlsx', submission_path='./submission_202207021235.csv', problem_path='./problem_202207021234.csv')\n",

								    "\n",

								    "# return the result as a pandas DataFrame\n",

								    "test.contest_score\n",

								    "\n",

								    "# Save result as excel\n",

								    "test.save('Result.xlsx')"

								   ]

								  },

								  {

								   "cell_type": "code",

								   "execution_count": null,

								   "id": "50e6428e",

								   "metadata": {},

								   "outputs": [],

								   "source": []

								  }

								 ],

								 "metadata": {

								  "kernelspec": {

								   "display_name": "Python 3 (ipykernel)",

								   "language": "python",

								   "name": "python3"

								  },

								  "language_info": {

								   "codemirror_mode": {

								    "name": "ipython",

								    "version": 3

								   },

								   "file_extension": ".py",

								   "mimetype": "text/x-python",

								   "name": "python",

								   "nbconvert_exporter": "python",

								   "pygments_lexer": "ipython3",

								   "version": "3.7.0"

								  }

								 },

								 "nbformat": 4,

								 "nbformat_minor": 5

								}