0% found this document useful (0 votes)

14 views7 pages

Data Science

The document contains several Python functions addressing various problems, including counting unique identical strings, finding the maximum repeating sequence, determining the longest alternating subsequence, and calculating maximum subarray cost. It also includes functions for analyzing sales data, such as revenue generation, sales percentages, and identifying unsold products in cities. Additionally, a simple Flask web application is provided for collecting user feedback.

Uploaded by

shdh78253

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as PDF, TXT or read online on Scribd

0% found this document useful (0 votes)

14 views7 pages

Data Science

Uploaded by

shdh78253

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as PDF, TXT or read online on Scribd

You are on page 1/ 7

# Unique identical strings

from typing import List

from collections import defaultdict

def solution(strs: List[str]) -> int:
    """Count pairs of strings that are built from the same set of characters.

    Two strings are "identical" here when their sets of distinct characters
    are equal, regardless of order or repetition (e.g. "bac" and "aabc").

    Args:
        strs: The strings to compare.

    Returns:
        The number of unordered pairs (i, j), i < j, whose strings share the
        same character set.
    """
    # Group strings by their character set; a frozenset is hashable and
    # avoids the sort + join that a string key would need.
    group_sizes = defaultdict(int)
    for s in strs:
        group_sizes[frozenset(s)] += 1

    # A group of n strings contributes C(n, 2) pairs (0 when n < 2).
    return sum(n * (n - 1) // 2 for n in group_sizes.values())

# Example usage:

# Sample inputs: the first has two matching pairs, the second has none.
strs1 = ["good", "god", "yarm", "bac", "aabc"]
strs2 = ["cba", "nba", "dba"]

print(solution(strs1))  # Expected output: 2
print(solution(strs2))  # Expected output: 0

# Max Repeating sequence

def maxRepeating(sequence: str, word: str) -> int:
    """Return the largest k such that `word` repeated k times occurs in `sequence`.

    Args:
        sequence: The string to search in.
        word: The string whose consecutive repetitions are counted.

    Returns:
        The maximum k for which ``word * k`` is a substring of ``sequence``;
        0 when `word` does not occur at all or is empty.
    """
    # An empty word is a substring of everything, so the loop below would
    # never terminate; treat it as "no repetitions".
    if not word:
        return 0

    count = 0
    while word * (count + 1) in sequence:
        count += 1
    return count

# Print the result so the example produces output when run as a script
# (a bare call silently discards the return value).
print(maxRepeating("ababc", word="ab"))  # Expected output: 2

# Longest Alternating Subsequence

def longest_alternating_subsequence(X):
    """Return 1 plus the number of positions where X differs from its predecessor.

    This equals the number of runs of equal adjacent elements in `X`.

    Args:
        X: An indexable sequence (e.g. a list of 0/1 values).

    Returns:
        0 for an empty sequence, otherwise the count described above.
    """
    if not X:
        return 0

    # Each change between neighbours extends the alternating subsequence by one.
    changes = sum(X[i] != X[i - 1] for i in range(1, len(X)))
    return 1 + changes

# Examples

# Sample inputs: a fully alternating sequence and a single-element one.
X1, X2 = [0, 1, 0, 1, 0], [0]

print(longest_alternating_subsequence(X1))  # Output: 5
print(longest_alternating_subsequence(X2))  # Output: 1

#Maximum Subarray Cost

def max_subarray_cost(arr):
    """Return the square of the maximum contiguous-subarray sum of `arr`.

    Args:
        arr: A sequence of numbers.

    Returns:
        0 for an empty sequence; otherwise the largest sum over all non-empty
        contiguous subarrays, squared. For an all-negative input the largest
        sum is the largest single element, so its square is returned.
    """
    if not arr:
        return 0

    best = float('-inf')
    running = 0
    for num in arr:
        running += num
        if running > best:
            best = running
        # A negative running total can only hurt later subarrays; restart.
        if running < 0:
            running = 0

    return best ** 2

# Sample inputs: alternating signs (best sum 1) and all positives (sum 6).
arr1, arr2 = [1, -1, 1, -1, 1], [1, 2, 3]

print(max_subarray_cost(arr1))  # Output: 1
print(max_subarray_cost(arr2))  # Output: 36

# Longest Common Prefix

def longest_common_prefix(input_string_lst):
    """Return the longest prefix shared by every string in the list.

    Args:
        input_string_lst: A list of strings.

    Returns:
        The common prefix, or "" when the list is empty or nothing is shared.
    """
    if not input_string_lst:
        return ""

    # Start with the first string and trim from the right until it fits
    # each remaining string.
    prefix = input_string_lst[0]
    for string in input_string_lst[1:]:
        while prefix and not string.startswith(prefix):
            prefix = prefix[:-1]
        if not prefix:
            # Nothing in common; no later string can bring it back.
            return ""
    return prefix

input_strings = ["relation", "renation", "restation"]
common_prefix = longest_common_prefix(input_strings)

print("Longest Common Prefix:", common_prefix)  # prints: Longest Common Prefix: re

# Longest Common Postfix (suffix)

def longest_common_postfix(input_string_lst):
    """Return the longest suffix shared by every string in the list.

    Args:
        input_string_lst: A list of strings.

    Returns:
        The common suffix, or "" when the list is empty or nothing is shared.
    """
    if not input_string_lst:
        return ""

    # Start with the first string and trim from the left until it fits
    # each remaining string.
    suffix = input_string_lst[0]
    for string in input_string_lst[1:]:
        while suffix and not string.endswith(suffix):
            suffix = suffix[1:]
        if not suffix:
            # Nothing in common; no later string can bring it back.
            return ""
    return suffix

input_strings = ["relation", "nation", "station"]
common_postfix = longest_common_postfix(input_strings)

print("Longest Common Postfix:", common_postfix)  # prints: Longest Common Postfix: ation

# EDA / Feature Engineering

# Question 1: How much revenue was generated from the three top-selling product categories?

# NOTE(review): assumes `df` is the sales DataFrame loaded earlier — confirm.
# Strip "$" and "," so 'Sales' is numeric. The cleanup is applied to `df`,
# the same frame that is aggregated below; the pattern is a raw string so
# `\$` is not treated as an (invalid) Python escape sequence.
df['Sales'] = df['Sales'].replace(r'[\$,]', '', regex=True).astype(float)

# Total sales per category, keeping only the three largest totals.
top_categories_revenue = df.groupby('Product Category')['Sales'].sum().nlargest(3)

print("Revenue from top 3 product categories:\n", top_categories_revenue)
print("Total revenue from top 3 categories: $", top_categories_revenue.sum())

# Question 2: What percentage of overall Sales do each of the categories contribute in 2019?

# Parse order dates so the year can be extracted.
df['Order Date'] = pd.to_datetime(df['Order Date'])

# Restrict to orders placed in 2019.
df_2019 = df.loc[df['Order Date'].dt.year == 2019]

# Per-category totals and their share of the 2019 grand total.
category_sales_2019 = df_2019.groupby('Product Category')['Sales'].sum()
total_sales_2019 = category_sales_2019.sum()
category_sales_percentage = category_sales_2019.div(total_sales_2019).mul(100)

print("Percentage of overall sales by category in 2019:\n", category_sales_percentage)

# Question 3: Which product category shows the widest price range of products?

# Strip "$" and "," so 'Price Each' is numeric. The dollar pattern is a raw
# string so `\$` is not treated as an (invalid) Python escape sequence.
df['Price Each'] = df['Price Each'].replace({r'\$': '', ',': ''}, regex=True).astype(float)

# Price spread (max - min) within each category.
price_range = df.groupby('Product Category')['Price Each'].agg(lambda x: x.max() - x.min())

widest_price_range_category = price_range.idxmax()

print("Category with widest price range:", widest_price_range_category)
print("Price range for", widest_price_range_category, ":", price_range.max(), "$")

# Question 4: Plot the Sales trend for iPhone on a Monthly basis.

import matplotlib.pyplot as plt

# Bucket every order into its calendar month.
df['Month'] = df['Order Date'].dt.to_period('M')

# Monthly sales totals for iPhone rows only.
is_iphone = df['Product'] == 'iPhone'
iphone_sales = df.loc[is_iphone].groupby('Month')['Sales'].sum()

iphone_sales.plot(
    kind='line',
    marker='o',
    figsize=(10, 6),
    title="Monthly iPhone Sales Trend",
)
plt.xlabel("Month")
plt.ylabel("Sales")
plt.show()
# Question 5: For every city, list the products that have not yet been sold in that city.

# Every product that appears anywhere in the data.
all_products = set(df['Product'].unique())

# Set of products sold in each city.
city_products = df.groupby('City')['Product'].apply(set)

# Products missing from a city = all products minus those sold there.
unsold_products = {
    city: all_products.difference(sold)
    for city, sold in city_products.items()
}

for city, products in unsold_products.items():
    print(f"Unsold products in {city}: {products}")

# Question 6: List the top 3 cities in terms of the number of orders for each time of the day.

# Number of orders for every (time of day, city) combination.
top_cities_time_of_day = (
    df.groupby(['Time of Day', 'City'])['OrderID']
    .count()
    .reset_index(name='Order Count')
)

# Top 3 cities per time of day. Sorting and taking the head of each group
# keeps 'Time of Day' as a regular column; groupby.apply operating on the
# grouping column is deprecated in pandas, and once apply excludes it the
# following reset_index(drop=True) would discard the time-of-day label.
top_cities = (
    top_cities_time_of_day
    .sort_values(['Time of Day', 'Order Count'], ascending=[True, False])
    .groupby('Time of Day')
    .head(3)
    .reset_index(drop=True)
)

print("Top 3 cities for each time of day:\n", top_cities)

# Question 7: Find the top 3 customers by Sales.

# Total sales per customer, then keep the three largest totals.
sales_per_customer = df.groupby('Customer_ID')['Sales'].sum()
top_customers = sales_per_customer.nlargest(3)

print("Top 3 customers by sales:\n", top_customers)

# Simple Web Page

from flask import Flask, request

from markupsafe import escape

# Flask application object; the @app.route / @app.errorhandler decorators
# in this file register their handlers on it.
app = Flask(__name__)

# Homepage route

@app.route('/')
def index():
    """Serve the feedback form.

    The form POSTs the fields ``name``, ``email`` and ``feedback`` to
    ``/submit``.

    Returns:
        The form's HTML as a string.
    """
    return '''

<form action="/submit" method="post">

Name: <input type="text" name="name"><br>

Email: <input type="text" name="email"><br>

Feedback: <textarea name="feedback"></textarea><br>

<input type="submit" value="Submit">

</form>

'''

# Feedback submission handler

@app.route('/submit', methods=['POST'])
def submit():
    """Validate a submitted feedback form and render a thank-you page.

    Reads ``name``, ``email`` and ``feedback`` from the POSTed form data.

    Returns:
        A ``(message, 400)`` tuple when any field is missing or blank;
        otherwise the thank-you HTML echoing the HTML-escaped values.
    """
    # .get() with a default means a missing field reaches our own validation
    # message instead of Flask's generic 400 page; strip() rejects
    # whitespace-only values.
    name = request.form.get('name', '').strip()
    email = request.form.get('email', '').strip()
    feedback = request.form.get('feedback', '').strip()

    if not (name and email and feedback):
        # Report the validation failure as a client error, not a 200 OK.
        return "All Fields Required. Kindly fill the Name , Email and feedback", 400

    # Escape user input before interpolating it into HTML (prevents XSS).
    name = escape(name)
    email = escape(email)
    feedback = escape(feedback)

    return f'''

<h1>Thank You for Your Feedback!</h1>

<p><strong>Name:</strong> {name}</p>

<p><strong>Email:</strong> {email}</p>

<p><strong>Feedback:</strong> {feedback}</p>

'''

@app.errorhandler(404)
def page_not_found(e):
    """Render the custom "not found" page.

    Args:
        e: The error passed in by Flask for the unmatched request.

    Returns:
        A ``(html, 404)`` tuple. The status code is returned explicitly
        because a bare string from an error handler is sent as 200 OK.
    """
    error_page = '''

<h1> 404 page not found </h1>

'''

    return error_page, 404

if __name__ == '__main__':
    # NOTE(review): debug=True turns on Flask's interactive debugger and
    # auto-reloader; keep it for local development only, never in production.
    app.run(debug=True)

Python Usecases
No ratings yet
Python Usecases
46 pages
DSA Interview Questions
No ratings yet
DSA Interview Questions
14 pages
Python Ussecases Interview Based Questions: The-Grand-Complete-Data-Science-Materials
No ratings yet
Python Ussecases Interview Based Questions: The-Grand-Complete-Data-Science-Materials
23 pages
LeetCode Problems
No ratings yet
LeetCode Problems
4 pages
100 Questions
No ratings yet
100 Questions
20 pages
Complete DSA Interview
No ratings yet
Complete DSA Interview
35 pages
Top 50 DSA Pseudo Code Questions For Garrett Motio
No ratings yet
Top 50 DSA Pseudo Code Questions For Garrett Motio
15 pages
Python Algorithms and Data Structures Guide
No ratings yet
Python Algorithms and Data Structures Guide
28 pages
7 Eleven Technical Interview Answers
No ratings yet
7 Eleven Technical Interview Answers
4 pages
Python Practicale
No ratings yet
Python Practicale
7 pages
Google Coding Problems Solutions
No ratings yet
Google Coding Problems Solutions
3 pages
Leetcode 75 Blind - Part 1
No ratings yet
Leetcode 75 Blind - Part 1
11 pages
Python 50 Interview Guide Full
No ratings yet
Python 50 Interview Guide Full
21 pages
Python Functions for Common Tasks
No ratings yet
Python Functions for Common Tasks
3 pages
PracticalFile HITESH
No ratings yet
PracticalFile HITESH
29 pages
Python Max
No ratings yet
Python Max
7 pages
Array
No ratings yet
Array
7 pages
Python DSA Interview Solutions
No ratings yet
Python DSA Interview Solutions
14 pages
Python Lab Assignments Report
No ratings yet
Python Lab Assignments Report
32 pages
? Python Data Structures How To Use
No ratings yet
? Python Data Structures How To Use
9 pages
Probs
No ratings yet
Probs
18 pages
Code2pdf 6745a8e0eefda
No ratings yet
Code2pdf 6745a8e0eefda
2 pages
29 Final Review
No ratings yet
29 Final Review
59 pages
Arrays
No ratings yet
Arrays
17 pages
Final HW
No ratings yet
Final HW
11 pages
Quiz Complete
No ratings yet
Quiz Complete
4 pages
Pythonrecord
No ratings yet
Pythonrecord
13 pages
Python Practical
No ratings yet
Python Practical
20 pages
Answer Key For Pb-Ii
No ratings yet
Answer Key For Pb-Ii
12 pages
De Interview Raamashaamy Qna Bank
No ratings yet
De Interview Raamashaamy Qna Bank
11 pages
Python Interview Qes.
No ratings yet
Python Interview Qes.
9 pages
Python Programming Basics
No ratings yet
Python Programming Basics
17 pages
100 DSA Python
No ratings yet
100 DSA Python
45 pages
Arrays and Strings Solutions
No ratings yet
Arrays and Strings Solutions
4 pages
Slicing
No ratings yet
Slicing
9 pages
Simple
No ratings yet
Simple
4 pages
Real Python Interview Questions American Express
No ratings yet
Real Python Interview Questions American Express
7 pages
Project Ip
No ratings yet
Project Ip
51 pages
Practiceset 5
No ratings yet
Practiceset 5
11 pages
Leetcode Practice
No ratings yet
Leetcode Practice
67 pages
23BBS0006 VL2023240506353 Ast03
No ratings yet
23BBS0006 VL2023240506353 Ast03
8 pages
Class 10 T-1 Practical File
No ratings yet
Class 10 T-1 Practical File
8 pages
Python DS Notes Detailed
No ratings yet
Python DS Notes Detailed
6 pages
American Express Data Analyst DSA Interview Questions
No ratings yet
American Express Data Analyst DSA Interview Questions
16 pages
LAB 1 Assignment
No ratings yet
LAB 1 Assignment
4 pages
Leetcode 75
No ratings yet
Leetcode 75
10 pages
Python Cheatsheet 2
No ratings yet
Python Cheatsheet 2
4 pages
Python Lab PRG
No ratings yet
Python Lab PRG
20 pages
ÔN TẬP FINAL NGÔN NGỮ LẬP TRÌNH
No ratings yet
ÔN TẬP FINAL NGÔN NGỮ LẬP TRÌNH
121 pages
Day 11
No ratings yet
Day 11
7 pages
American Express
No ratings yet
American Express
16 pages
Assignment 3
No ratings yet
Assignment 3
7 pages
Cnba VCaacbjk
No ratings yet
Cnba VCaacbjk
2 pages
Cycle-I Solutions
No ratings yet
Cycle-I Solutions
7 pages
Computer Science Programs
No ratings yet
Computer Science Programs
13 pages
1 Dynamic Programming Programming: 1.1 1. Longest Increasing Subsequence
No ratings yet
1 Dynamic Programming Programming: 1.1 1. Longest Increasing Subsequence
21 pages
Competitive Programming Tasks 1
No ratings yet
Competitive Programming Tasks 1
11 pages
Python Lab Challenges
No ratings yet
Python Lab Challenges
12 pages
Mock 1
No ratings yet
Mock 1
14 pages
Molecular Regulation of NK Cell Maturation
No ratings yet
Molecular Regulation of NK Cell Maturation
28 pages
Genetic Links to Soccer Hamstring Injuries
No ratings yet
Genetic Links to Soccer Hamstring Injuries
8 pages
Population Genetics A Concise Guide, 2nd Edition Entire PDF Ebook
100% (11)
Population Genetics A Concise Guide, 2nd Edition Entire PDF Ebook
15 pages
ICSE Class 10 Question Paper Biology 2007 PDF
No ratings yet
ICSE Class 10 Question Paper Biology 2007 PDF
20 pages
Ellen 2010theories in Anthropology
No ratings yet
Ellen 2010theories in Anthropology
19 pages
Transposition 2
No ratings yet
Transposition 2
19 pages
Living World: Key Concepts & Questions
No ratings yet
Living World: Key Concepts & Questions
13 pages
Genetics Exam Practice
No ratings yet
Genetics Exam Practice
9 pages
Lecture 4
No ratings yet
Lecture 4
20 pages
Biology
No ratings yet
Biology
1 page
E1.2 Homework - Biologos Exploration - LoG-2
No ratings yet
E1.2 Homework - Biologos Exploration - LoG-2
3 pages
BS Biology Revised List of Major Courses
0% (1)
BS Biology Revised List of Major Courses
10 pages
Wiberg Et Al - 2019 - Genetics - Brain
No ratings yet
Wiberg Et Al - 2019 - Genetics - Brain
10 pages
Kuby 07 V 7
No ratings yet
Kuby 07 V 7
47 pages
Computational Biology
No ratings yet
Computational Biology
12 pages
Enhancer: Q1) What Is Role of Enhancers and Promoters in Transcription of Eukaryotes? Ans
No ratings yet
Enhancer: Q1) What Is Role of Enhancers and Promoters in Transcription of Eukaryotes? Ans
9 pages
DLP Mitosis
No ratings yet
DLP Mitosis
7 pages
Q1 Week 4 Biology G9
No ratings yet
Q1 Week 4 Biology G9
16 pages
Introduction To Prehistory - Pre and Protohistoric Cultures of India
No ratings yet
Introduction To Prehistory - Pre and Protohistoric Cultures of India
20 pages
Biology2 Q3 Module 3 Evolution and - Origin of Biodiversity
No ratings yet
Biology2 Q3 Module 3 Evolution and - Origin of Biodiversity
15 pages
Classification of Bilateria
No ratings yet
Classification of Bilateria
6 pages
Computing With DNA
No ratings yet
Computing With DNA
12 pages
Paper 3B
No ratings yet
Paper 3B
21 pages
Genomic Medicine Principles and Practice, 2nd Edition Premium Download
100% (21)
Genomic Medicine Principles and Practice, 2nd Edition Premium Download
15 pages
Ribosome Structure & Function Guide
No ratings yet
Ribosome Structure & Function Guide
20 pages
Chapter 13 End of Course - 241124 - 192023
No ratings yet
Chapter 13 End of Course - 241124 - 192023
4 pages
Microbiologist Career Profile
No ratings yet
Microbiologist Career Profile
4 pages
20630-Article Text-64327-77270-10-20160812
No ratings yet
20630-Article Text-64327-77270-10-20160812
8 pages
Sporophyte of Riccia
No ratings yet
Sporophyte of Riccia
9 pages
Activity # 12 Gene Therapy Answer
No ratings yet
Activity # 12 Gene Therapy Answer
3 pages

Data Science

Uploaded by

Data Science

Uploaded by

# Unique identical strings

from typing import List

from collections import defaultdict

def solution(strs: List[str]) -> int:

# Dictionary to count occurrences of each unique character set

# Normalize each string by considering only the unique characters

normalized = ''.join(sorted(set(s))) # Sort the unique characters

# Calculate the number of identical pairs

for count in normalized_count.values():

identical_pairs += count * (count - 1) // 2 # Combination formula

strs1 = ["good", "god", "yarm", "bac", "aabc"]

print(solution(strs1)) # Expected output: 2

strs2 = ["cba", "nba", "dba"]

print(solution(strs2)) # Expected output: 0

# Max Repeating sequence

def maxRepeating(sequence: str, word: str) -> int:

while word *(count+1) in sequence:

maxRepeating("ababc", word= "ab")

for i in range(1, len(X)):

if X[i] != X[i - 1]: # Check if adjacent elements alternate

#Maximum Subarray Cost

for num in arr:

max_sum = max(max_sum, current_sum)

arr1 = [1, -1, 1, -1, 1]

# Longest Common Prefix

for string in input_string_lst[1:]:

while not string.startswith(prefix):

input_strings = ["relation", "renation", "restation"]

print("Longest Common Prefix:", longest_common_prefix(input_strings))

for string in input_string_lst[1:]:

while not string.endswith(suffix):

input_strings = ["relation", "nation", "station"]

print("Longest Common Postfix:", longest_common_postfix(input_strings))

top_categories_revenue = (df.groupby('Product Category')['Sales'].sum().nlargest(3))

print("Revenue from top 3 product categories:\n", top_categories_revenue)

print("Total revenue from top 3 categories: $", top_categories_revenue.sum())

# Question 2: What percentage of overall Sales do each of the categories contribute in

df['Order Date'] = pd.to_datetime(df['Order Date'])

df_2019 = df[df['Order Date'].dt.year == 2019]

category_sales_2019 = df_2019.groupby('Product Category')['Sales'].sum()

category_sales_percentage = (category_sales_2019 / total_sales_2019) * 100

print("Percentage of overall sales by category in 2019:\n", category_sales_percentage)

df['Price Each'] = df['Price Each'].replace({'\$': '', ',': ''}, regex=True).astype(float)

price_range = (df.groupby('Product Category')['Price Each'].agg(lambda x: x.max() - x.min()))

print("Category with widest price range:", widest_price_range_category)

print("Price range for", widest_price_range_category, ":", price_range.max(), "$")

# Question 4: Plot the Sales trend for iPhone on a Monthly basis.

import matplotlib.pyplot as plt

df['Month'] = df['Order Date'].dt.to_period('M') # Extract Month

iphone_sales = df[df['Product'] == 'iPhone'].groupby('Month')['Sales'].sum()

iphone_sales.plot(kind='line', marker='o', figsize=(10, 6), title="Monthly iPhone Sales Trend")

unsold_products = {city: all_products - products for city, products in city_products.items()}

for city, products in unsold_products.items():

print(f"Unsold products in {city}: {products}")

top_cities_time_of_day = (df.groupby(['Time of Day', 'City'])['OrderID']

top_cities = (top_cities_time_of_day.groupby('Time of Day').apply(lambda x: x.nlargest

(3, 'Order Count')).reset_index(drop=True))

print("Top 3 cities for each time of day:\n", top_cities)

# Question 7: Find the top 3 customers by Sales.

print("Top 3 customers by sales:\n", top_customers)

# Simple Web Page

from flask import Flask, request

from markupsafe import escape

<form action="/submit" method="post">

Name: <input type="text" name="name"><br>

Email: <input type="text" name="email"><br>

Feedback: <textarea name="feedback"></textarea><br>

<input type="submit" value="Submit">

# Feedback submission handler

if not name or not email or not feedback:

<h1>Thank You for Your Feedback!</h1>

<h1> 404 page not found <h1>

You might also like