About Lesson
Join the conversation
data:image/s3,"s3://crabby-images/6738e/6738e6fe3587761ef8c1feed7953c495c03840c7" alt=""
# Function to convert sizes to MB
def convert_to_mb(size):
    """Convert an app-size value to a number of megabytes.

    Args:
        size: A string such as ``"512k"`` (kilobytes) or ``"19M"``
            (megabytes). Plain numbers are treated as already being in MB,
            so applying the function twice to the same column is harmless.

    Returns:
        The size in MB as a float, or ``None`` when the value is not a
        recognised size (for example ``"Varies with device"`` or ``None``).
        A NaN input is returned as NaN.
    """
    # Numbers (including NaN) carry no unit suffix; pass them through.
    if isinstance(size, (int, float)):
        return float(size)
    if not isinstance(size, str):
        return None

    text = size.strip()
    if text.endswith("k"):
        number, divisor = text[:-1], 1024  # Convert KB to MB
    elif text.endswith("M"):
        number, divisor = text[:-1], 1  # Already in MB
    else:
        return None  # Handle unexpected values

    try:
        return float(number) / divisor
    except ValueError:
        # A suffix was present but the numeric part is malformed.
        return None


# Apply the conversion function to the column
# The result goes into a new "Size_in_MB" column, so the raw "Size" strings
# are left untouched.
df["Size_in_MB"] = df["Size"].apply(convert_to_mb)
# Preview the first rows (presumably run as the last line of a notebook cell).
df.head()
Reply
data:image/s3,"s3://crabby-images/82d47/82d47f2854348d31b5f6c2802274c8fca249f35d" alt=""
all assignments sir,
# Function to convert sizes to MB
def convert_to_mb(size):
    """Convert an app-size value to a number of megabytes.

    The unit suffix is matched case-insensitively.

    Args:
        size: A string such as ``"512k"`` (kilobytes) or ``"19M"``
            (megabytes). Plain numbers are treated as already being in MB,
            so re-running the conversion on an already converted column
            does not fail.

    Returns:
        The size in MB as a float, or ``None`` when the value is not a
        recognised size (for example ``"Varies with device"`` or ``None``).
        A NaN input is returned as NaN.
    """
    # Numbers (including NaN) carry no unit suffix; pass them through.
    if isinstance(size, (int, float)):
        return float(size)
    if not isinstance(size, str):
        return None

    text = size.strip().lower()
    if text.endswith('m'):  # Check if the value is in MB
        number, divisor = text[:-1], 1
    elif text.endswith('k'):  # Check if the value is in KB
        number, divisor = text[:-1], 1024
    else:
        return None  # Handle unexpected cases

    try:
        return float(number) / divisor
    except ValueError:
        # A suffix was present but the numeric part is malformed.
        return None


# Apply the conversion function to the Size column
# Overwrite the "Size" column with the sizes converted to MB.
df['Size'] = df['Size'].apply(convert_to_mb)
df.head()

# Strip the currency symbol as a literal character: when regex matching is
# enabled, "$" is the end-of-string anchor and the dollar sign stays in place.
df["Price"] = df["Price"].str.replace("$", "", regex=False).astype(float)

# Drop thousands separators and any trailing "+" (both matched literally),
# then convert the cleaned text to integers.
df['Installs'] = (
    df['Installs']
    .str.replace(",", "", regex=False)
    .str.replace("+", "", regex=False)
    .str.strip()
    .astype(int)
)
Reply
data:image/s3,"s3://crabby-images/82d47/82d47f2854348d31b5f6c2802274c8fca249f35d" alt=""
ASSIGNMENT
# Function to convert sizes to MB
def convert_to_mb(size):
    """Convert an app-size value to a number of megabytes.

    The unit suffix is matched case-insensitively.

    Args:
        size: A string such as ``"512k"`` (kilobytes) or ``"19M"``
            (megabytes). Plain numbers are treated as already being in MB,
            so re-running the conversion on an already converted column
            does not fail.

    Returns:
        The size in MB as a float, or ``None`` when the value is not a
        recognised size (for example ``"Varies with device"`` or ``None``).
        A NaN input is returned as NaN.
    """
    # Numbers (including NaN) carry no unit suffix; pass them through.
    if isinstance(size, (int, float)):
        return float(size)
    if not isinstance(size, str):
        return None

    text = size.strip().lower()
    if text.endswith('m'):  # Check if the value is in MB
        number, divisor = text[:-1], 1
    elif text.endswith('k'):  # Check if the value is in KB
        number, divisor = text[:-1], 1024
    else:
        return None  # Handle unexpected cases

    try:
        return float(number) / divisor
    except ValueError:
        # A suffix was present but the numeric part is malformed.
        return None


# Apply the conversion function to the Size column
# Overwrite the "Size" column in place with the values returned by
# convert_to_mb.
df['Size'] = df['Size'].apply(convert_to_mb)
# Preview the first rows (presumably run as the last line of a notebook cell).
df.head()
Reply
data:image/s3,"s3://crabby-images/8019d/8019dc0f3589c07582cd61bb0b769ede3bd9a1d5" alt=""
# Strip the currency symbol. regex=False makes "$" a literal character; as a
# regular expression it is the end-of-string anchor and would remove nothing.
df['Price'] = df['Price'].str.replace('$', '', regex=False)
# Remove non-numeric values from the Price column (they become NaN)
df['Price'] = pd.to_numeric(df['Price'], errors='coerce')
# Replace NaN values with 0
df['Price'] = df['Price'].fillna(0)
Reply
data:image/s3,"s3://crabby-images/8019d/8019dc0f3589c07582cd61bb0b769ede3bd9a1d5" alt=""
# Remove the "+" suffix. regex=False is required for a literal match: a lone
# "+" is not a valid regular expression.
df['Installs'] = df['Installs'].str.replace('+', '', regex=False)
# Replace 'Free' values with 0
df['Installs'] = df['Installs'].replace('Free', '0')
# Convert the Installs column to integer values
df['Installs'] = df['Installs'].str.replace(',', '', regex=False).astype(int)
# Define the bins for the Installs column
bins_installs = [0, 1000, 10000, 100000, 1000000]
# Define the labels for each bin
labels_installs = ['Few', 'Some', 'Many', 'Very Many']
# Apply the binning method to the Installs column.
# include_lowest=True keeps rows with exactly 0 installs (such as the 'Free'
# rows mapped to '0' above) in the first bin instead of turning them into NaN.
# NOTE(review): values above 1,000,000 still fall outside every bin and become
# NaN - confirm whether the last bin should be open-ended.
df['Installs_Binned'] = pd.cut(
    df['Installs'],
    bins=bins_installs,
    labels=labels_installs,
    include_lowest=True,
)
Reply
data:image/s3,"s3://crabby-images/8019d/8019dc0f3589c07582cd61bb0b769ede3bd9a1d5" alt=""
def convert_to_mb(size):
    """Normalise an app size to a string expressed in megabytes, e.g. ``'1.5M'``.

    Args:
        size: A size string ending in ``'k'`` (kilobytes) or ``'M'``
            (megabytes), a plain number, or any other value.

    Returns:
        * ``'<value>M'`` for a ``'k'`` string, converted to MB and rounded to
          two decimals.
        * The string unchanged when it already ends in ``'M'`` or is not a
          recognised size (e.g. ``'Varies with device'``).
        * ``str(size) + 'M'`` for an int or float.
        * NaN and every other value unchanged.

    Raises:
        ValueError: If the text before a trailing ``'k'`` is not a number.
    """
    if isinstance(size, str):
        if size.endswith('k'):
            return str(round(float(size[:-1]) / 1024, 2)) + 'M'
        # Already in MB, or not a size at all: hand the text back untouched
        # rather than falling through to an implicit None.
        return size
    # `size == size` is False only for NaN, which must not become 'nanM'.
    if isinstance(size, (int, float)) and size == size:
        return str(size) + 'M'
    return size


df['Size'] = df['Size'].apply(convert_to_mb)
Reply
data:image/s3,"s3://crabby-images/b80b3/b80b3ae9e04ed406421b192a4d9eb25b5c50fc3b" alt=""
# Replace 'Varies with device' with NaN for numerical operations
df['Size'] = df['Size'].replace('Varies with device', np.nan)


# Convert Size to numeric, handling 'k' and 'M'
def convert_size(size_str):
    """Convert a size value to a float number of megabytes.

    Args:
        size_str: A string containing ``'k'`` (kilobytes) or ``'M'``
            (megabytes), a missing value, or a plain number. Numbers are
            treated as already being in MB so the conversion can be re-run
            on an already converted column.

    Returns:
        The size in MB as a float, or NaN for missing or unrecognised values.

    Raises:
        ValueError: If the text left after removing the unit is not a number.
    """
    if pd.isna(size_str):
        return np.nan
    if isinstance(size_str, (int, float)):
        return float(size_str)
    if not isinstance(size_str, str):
        return np.nan
    if 'k' in size_str:
        return float(size_str.replace('k', '')) / 1024
    if 'M' in size_str:
        return float(size_str.replace('M', ''))
    return np.nan


df['Size'] = df['Size'].apply(convert_size)

# Clean 'Installs' column
# regex=False matches "+" and "," literally; a lone "+" is not a valid
# regular expression.
df['Installs'] = (
    df['Installs']
    .astype(str)
    .str.replace('+', '', regex=False)
    .str.replace(',', '', regex=False)
)
df['Installs'] = pd.to_numeric(df['Installs'], errors='coerce')

# Handle 'Rating' column
df['Rating'] = pd.to_numeric(df['Rating'], errors='coerce')
Reply
data:image/s3,"s3://crabby-images/91523/9152381168dd00c061297a2e19315a80ebdb0786" alt=""
I have read both blogs. Both blogs are very informative.
Reply
data:image/s3,"s3://crabby-images/86197/861977be8cf86d49b9c89c9ac964fa8281fc13b3" alt=""
import numpy as np
kbs = 1024  # example value in KB
# 1 MB = 1024 KB; round the result to two decimal places.
mbs = np.round(kbs / 1024, 2)
print(mbs)
Reply
data:image/s3,"s3://crabby-images/f448e/f448e1c3363c9cbebcbef5b51dbe16856e42ba1b" alt=""
assignment done.
Reply