Add new files

ch-garcia · ch-garcia · commit 6a9a219d1f67 · 2025-03-19T15:24:37.000+01:00
diff --git a/introduction-pandas/2877-create-dataframe-list.py b/introduction-pandas/2877-create-dataframe-list.py
@@ -0,0 +1,39 @@
+"""
+2877. Create a DataFrame from List
+Solved
+Easy
+Companies
+Hint
+Write a solution to create a DataFrame from a 2D list called student_data. This 2D list contains the IDs and ages of some students.
+
+The DataFrame should have two columns, student_id and age, and be in the same order as the original 2D list.
+
+The result format is in the following example.
+
+Example 1:
+
+Input:
+student_data:
+[
+  [1, 15],
+  [2, 11],
+  [3, 11],
+  [4, 20]
+]
+Output:
++------------+-----+
+| student_id | age |
++------------+-----+
+| 1          | 15  |
+| 2          | 11  |
+| 3          | 11  |
+| 4          | 20  |
++------------+-----+
+Explanation:
+A DataFrame was created on top of student_data, with two columns named student_id and age.
+"""
+
+import pandas as pd
+
+def createDataframe(student_data: list[list[int]]) -> pd.DataFrame:
+    return pd.DataFrame(student_data, columns=["student_id", "age"])  # one row per [id, age] pair
diff --git a/introduction-pandas/2878-get-size-dataframe.py b/introduction-pandas/2878-get-size-dataframe.py
@@ -0,0 +1,51 @@
+"""
+2878. Get the Size of a DataFrame
+Solved
+Easy
+Companies
+Hint
+DataFrame players:
++-------------+--------+
+| Column Name | Type   |
++-------------+--------+
+| player_id   | int    |
+| name        | object |
+| age         | int    |
+| position    | object |
+| ...         | ...    |
++-------------+--------+
+Write a solution to calculate and display the number of rows and columns of players.
+
+Return the result as an array:
+
+[number of rows, number of columns]
+
+The result format is in the following example.
+
+Example 1:
+
+Input:
++-----------+----------+-----+-------------+--------------------+
+| player_id | name     | age | position    | team               |
++-----------+----------+-----+-------------+--------------------+
+| 846       | Mason    | 21  | Forward     | RealMadrid         |
+| 749       | Riley    | 30  | Winger      | Barcelona          |
+| 155       | Bob      | 28  | Striker     | ManchesterUnited   |
+| 583       | Isabella | 32  | Goalkeeper  | Liverpool          |
+| 388       | Zachary  | 24  | Midfielder  | BayernMunich       |
+| 883       | Ava      | 23  | Defender    | Chelsea            |
+| 355       | Violet   | 18  | Striker     | Juventus           |
+| 247       | Thomas   | 27  | Striker     | ParisSaint-Germain |
+| 761       | Jack     | 33  | Midfielder  | ManchesterCity     |
+| 642       | Charlie  | 36  | Center-back | Arsenal            |
++-----------+----------+-----+-------------+--------------------+
+Output:
+[10, 5]
+Explanation:
+This DataFrame contains 10 rows and 5 columns.
+"""
+
+import pandas as pd
+
+def getDataframeSize(players: pd.DataFrame) -> list[int]:
+    return list(players.shape)  # shape is (rows, columns); hand it back as a list
diff --git a/introduction-pandas/2880-select-data.py b/introduction-pandas/2880-select-data.py
@@ -0,0 +1,43 @@
+"""
+2880. Select Data
+Solved
+Easy
+Companies
+Hint
+DataFrame students
++-------------+--------+
+| Column Name | Type   |
++-------------+--------+
+| student_id  | int    |
+| name        | object |
+| age         | int    |
++-------------+--------+
+
+Write a solution to select the name and age of the student with student_id = 101.
+
+The result format is in the following example.
+
+Example 1:
+Input:
++------------+---------+-----+
+| student_id | name    | age |
++------------+---------+-----+
+| 101        | Ulysses | 13  |
+| 53         | William | 10  |
+| 128        | Henry   | 6   |
+| 3          | Henry   | 11  |
++------------+---------+-----+
+Output:
++---------+-----+
+| name    | age | 
++---------+-----+
+| Ulysses | 13  |
++---------+-----+
+Explanation:
+Student Ulysses has student_id = 101, we select the name and age.
+"""
+
+import pandas as pd
+
+def selectData(students: pd.DataFrame) -> pd.DataFrame:
+    return students.loc[students["student_id"].eq(101), ["name", "age"]]  # student 101 only
diff --git a/introduction-pandas/2881-create-new-column.py b/introduction-pandas/2881-create-new-column.py
@@ -0,0 +1,53 @@
+"""
+2881. Create a New Column
+Solved
+Easy
+Companies
+Hint
+DataFrame employees
++-------------+--------+
+| Column Name | Type   |
++-------------+--------+
+| name        | object |
+| salary      | int    |
++-------------+--------+
+A company plans to provide its employees with a bonus.
+
+Write a solution to create a new column named bonus that contains the doubled values of the salary column.
+
+The result format is in the following example.
+
+Example 1:
+
+Input:
+DataFrame employees
++---------+--------+
+| name    | salary |
++---------+--------+
+| Piper   | 4548   |
+| Grace   | 28150  |
+| Georgia | 1103   |
+| Willow  | 6593   |
+| Finn    | 74576  |
+| Thomas  | 24433  |
++---------+--------+
+Output:
++---------+--------+--------+
+| name    | salary | bonus  |
++---------+--------+--------+
+| Piper   | 4548   | 9096   |
+| Grace   | 28150  | 56300  |
+| Georgia | 1103   | 2206   |
+| Willow  | 6593   | 13186  |
+| Finn    | 74576  | 149152 |
+| Thomas  | 24433  | 48866  |
++---------+--------+--------+
+Explanation: 
+A new column bonus is created by doubling the value in the column salary.
+"""
+
+import pandas as pd
+
+def createBonusColumn(employees: pd.DataFrame) -> pd.DataFrame:
+    employees["bonus"] = employees["salary"].mul(2)  # written onto the caller's frame in place
+    return employees
diff --git a/introduction-pandas/2882-drop-duplicate-rows.py b/introduction-pandas/2882-drop-duplicate-rows.py
@@ -0,0 +1,52 @@
+"""
+2882. Drop Duplicate Rows
+Solved
+Easy
+Companies
+Hint
+DataFrame customers
++-------------+--------+
+| Column Name | Type   |
++-------------+--------+
+| customer_id | int    |
+| name        | object |
+| email       | object |
++-------------+--------+
+There are some duplicate rows in the DataFrame based on the email column.
+
+Write a solution to remove these duplicate rows and keep only the first occurrence.
+
+The result format is in the following example.
+
+ 
+
+Example 1:
+Input:
++-------------+---------+---------------------+
+| customer_id | name    | email               |
++-------------+---------+---------------------+
+| 1           | Ella    | emily@example.com   |
+| 2           | David   | michael@example.com |
+| 3           | Zachary | sarah@example.com   |
+| 4           | Alice   | john@example.com    |
+| 5           | Finn    | john@example.com    |
+| 6           | Violet  | alice@example.com   |
++-------------+---------+---------------------+
+Output:  
++-------------+---------+---------------------+
+| customer_id | name    | email               |
++-------------+---------+---------------------+
+| 1           | Ella    | emily@example.com   |
+| 2           | David   | michael@example.com |
+| 3           | Zachary | sarah@example.com   |
+| 4           | Alice   | john@example.com    |
+| 6           | Violet  | alice@example.com   |
++-------------+---------+---------------------+
+Explanation:
+Alice (customer_id = 4) and Finn (customer_id = 5) both use john@example.com, so only the first occurrence of this email is retained.
+"""
+
+import pandas as pd
+
+def dropDuplicateEmails(customers: pd.DataFrame) -> pd.DataFrame:
+    return customers.drop_duplicates(subset=["email"], keep="first")  # first row per email survives