0% found this document useful (0 votes)

11 views6 pages

D3 Docs

Uploaded by

bttghlgsj

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as DOCX, PDF, TXT or read online on Scribd

0% found this document useful (0 votes)

11 views6 pages

D3 Docs

Uploaded by

bttghlgsj

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as DOCX, PDF, TXT or read online on Scribd

You are on page 1/ 6

-- Create the books table: one row per book, keyed by book_id.
-- title is mandatory; edition and author are optional text columns.

CREATE TABLE books (

book_id INT PRIMARY KEY,
title VARCHAR(255) NOT NULL,
edition VARCHAR(50),
author VARCHAR(255)
);

-- Insert data into the books table: five sample rows, each with its own
-- title and edition, all sharing the author 'JOHN'.

INSERT INTO books (book_id, title, edition, author) VALUES (1, 'RAM', '1 EDITION', 'JOHN');
INSERT INTO books (book_id, title, edition, author) VALUES (2, 'sham', '2 EDITION', 'JOHN');
INSERT INTO books (book_id, title, edition, author) VALUES (3, 'pik', '3 EDITION', 'JOHN');
INSERT INTO books (book_id, title, edition, author) VALUES (4, 'ton', '4 EDITION', 'JOHN');
INSERT INTO books (book_id, title, edition, author) VALUES (5, 'mon', '5 EDITION', 'JOHN');

-- SLICE operation: fix a single dimension (edition = '1 EDITION') and count
-- the books that fall in that slice.

SELECT COUNT(book_id) AS num_books
FROM books
WHERE edition = '1 EDITION';

-- DICE operation: select books with the title 'pik'.
-- NOTE(review): a dice normally restricts two or more dimensions at once;
-- this query filters on title only, so it behaves like another slice.
-- Confirm the intended predicate.

SELECT book_id, title, edition
FROM books
WHERE title = 'pik';

-- ROLL-UP operation: aggregate up to the edition level, returning one row
-- per edition with the number of books in it.
SELECT edition, COUNT(*) AS num_books
FROM books
GROUP BY edition;

-- DRILL-DOWN operation: select all books with the author 'JOHN', returning
-- every column of each matching row.
-- NOTE(review): this is a plain filter rather than a move to a finer level
-- of a hierarchy; with the sample rows above every book matches.

SELECT *
FROM books
WHERE author = 'JOHN';

PAGE RANK
import numpy as np

def page_rank(n, links, d=0.85, max_iter=100, tol=1e-6):
    """Compute PageRank scores by power iteration.

    Args:
        n: Number of pages; ``links`` is treated as an ``n`` x ``n`` matrix.
        links: Link matrix. Every column is divided by its own sum, so
            column ``j`` describes the outgoing links of page ``j`` and a
            non-zero ``links[i, j]`` passes rank from page ``j`` to page ``i``.
            A column that sums to zero (a page with no links) is replaced by
            the uniform value ``1 / n``.
        d: Damping factor.
        max_iter: Upper bound on the number of power-iteration steps.
        tol: Iteration stops once the L1 change between two successive rank
            vectors drops below this value.

    Returns:
        A NumPy array of length ``n`` holding the rank of each page.
    """
    links = np.asarray(links, dtype=float)
    column_sums = links.sum(axis=0)
    dangling = column_sums == 0

    # Divide by 1 in dangling columns so 0/0 is never evaluated (it used to
    # emit a RuntimeWarning and produce NaNs that were then masked out).
    safe_sums = np.where(dangling, 1.0, column_sums)
    transition_matrix = np.where(dangling, 1.0 / n, links / safe_sums)

    ranks = np.ones(n) / n
    for _ in range(max_iter):
        new_ranks = (1 - d) / n + d * transition_matrix @ ranks
        delta = np.linalg.norm(new_ranks - ranks, 1)
        # Keep the newest iterate before testing convergence so the function
        # returns the converged vector, not the one from the step before.
        ranks = new_ranks
        if delta < tol:
            break
    return ranks

def main():
    """Read a link matrix from standard input and print each page's PageRank.

    The user is asked for the number of pages and then for one
    whitespace-separated row of integers per page.

    Raises:
        ValueError: If the page count is not positive, a value is not an
            integer, or a row does not contain exactly one entry per page.
    """
    n = int(input("Enter the number of pages: "))
    if n < 1:
        raise ValueError("the number of pages must be at least 1")

    rows = []
    for i in range(n):
        row = [int(token) for token in input(f"Row {i + 1}: ").split()]
        # A short or long row would otherwise surface later as an opaque
        # NumPy shape error inside page_rank.
        if len(row) != n:
            raise ValueError(f"row {i + 1} must contain exactly {n} values, got {len(row)}")
        rows.append(row)

    ranks = page_rank(n, np.array(rows))
    print("\nPageRank Values:")
    for i, rank in enumerate(ranks, 1):
        print(f"Page {i}: {rank:.6f}")


if __name__ == "__main__":
    main()

output:
Enter the number of pages: 3
Row 1: 0 1 1
Row 2: 1 0 1
Row 3: 1 1 0

PageRank Values:
Page 1: 0.333333
Page 2: 0.333333
Page 3: 0.333333

//DECISION TREE----------------------------------------------------------------------------------

import pandas as pd
from sklearn.datasets import load_iris
from sklearn.model_selection import train_test_split
from sklearn.tree import DecisionTreeClassifier
from sklearn.metrics import accuracy_score, classification_report, confusion_matrix

# Load the iris dataset into a DataFrame, with the class label in 'target'.
data = load_iris()
df = pd.DataFrame(data.data, columns=data.feature_names)
df['target'] = data.target

print("Dataset:")
print(df.head())

# Separate the feature columns from the label column.
X = df.drop(columns=['target'])
y = df['target']

# Hold out 30% of the rows for evaluation; the seed fixes the split.
X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.3, random_state=42)

# Seed the tree as well: scikit-learn permutes features at every split, so
# without random_state the fitted tree (and the scores below) can differ
# from one run to the next even though the split itself is fixed.
classifier = DecisionTreeClassifier(random_state=42)
classifier.fit(X_train, y_train)

y_pred = classifier.predict(X_test)

accuracy = accuracy_score(y_test, y_pred)

print(f"\nAccuracy: {accuracy:.2f}")
print("\nClassification Report:")
print(classification_report(y_test, y_pred))
print("\nConfusion Matrix:")
print(confusion_matrix(y_test, y_pred))
APRIORI ALGO---------------------------------------------------------------------------------
class Transaction:
    """One transaction: the collection of items that occur together."""

    def __init__(self, items):
        # items is stored exactly as passed in (no copy, no de-duplication).
        self.items = items

    def __repr__(self):
        return f"{type(self).__name__}(items={self.items!r})"

class Itemset:
    """A candidate itemset together with its support count."""

    def __init__(self, itemset):
        # itemset is stored exactly as passed in.
        self.itemset = itemset
        # Support starts at zero; it is filled in later by whoever counts it.
        self.count = 0

    def __repr__(self):
        return f"{type(self).__name__}(itemset={self.itemset!r}, count={self.count!r})"

def get_user_input():
    """Read the transactions from standard input.

    The user first enters how many transactions follow, then one line of
    comma-separated integer item ids per transaction.

    Returns:
        A list with one ``Transaction`` per line entered.

    Raises:
        ValueError: If the count or any non-blank item is not an integer.
    """
    transactions = []
    for _ in range(int(input("Enter the number of transactions: "))):
        raw = input("Enter items (comma-separated): ")
        # Skip blank fields so a trailing comma or an empty line does not
        # crash on int('').
        items = [int(token) for token in raw.split(',') if token.strip()]
        transactions.append(Transaction(items))
    return transactions

def count_items(transactions, num_items):
    """Count how often each item id occurs across all transactions.

    Args:
        transactions: Iterable of objects exposing an ``items`` iterable of
            integer item ids.
        num_items: Largest item id that may occur.

    Returns:
        A list of length ``num_items + 1`` where index ``i`` holds the number
        of occurrences of item ``i``. Repeats inside one transaction are each
        counted.

    Raises:
        IndexError: If an item id lies outside ``0..num_items``.
    """
    item_counts = [0] * (num_items + 1)
    for transaction in transactions:
        for item in transaction.items:
            # A negative id would otherwise wrap around and silently bump the
            # count of an unrelated item at the end of the list.
            if not 0 <= item <= num_items:
                raise IndexError(f"item id {item} is outside the range 0..{num_items}")
            item_counts[item] += 1
    return item_counts

def generate_candidates(prev_candidates, k):
    """Join frequent itemsets into the next, larger generation of candidates.

    Every pair of itemsets (taken in list order) whose first ``k - 2`` items
    are equal is joined: the new candidate is the earlier itemset extended by
    the later itemset's item at index ``k - 2``.

    Args:
        prev_candidates: List of ``Itemset`` objects from the previous round.
            NOTE(review): the join presumably relies on these being sorted,
            with sorted item lists, so that each result is itself sorted --
            confirm against the caller.
        k: Size of the itemsets to generate.

    Returns:
        A list of new ``Itemset`` objects with a support count of zero.
    """
    prefix_len = k - 2
    candidates = []
    for i, left in enumerate(prev_candidates):
        for right in prev_candidates[i + 1:]:
            if left.itemset[:prefix_len] == right.itemset[:prefix_len]:
                candidates.append(Itemset(left.itemset + [right.itemset[prefix_len]]))
    return candidates

def calculate_support(candidates, transactions):
    """Set each candidate's ``count`` to the number of transactions containing it.

    Args:
        candidates: Iterable of objects with an ``itemset`` attribute; their
            ``count`` attribute is overwritten in place.
        transactions: Iterable of objects with an ``items`` attribute.

    Returns:
        None. The result is written to ``candidate.count``.
    """
    # Build each transaction's set once instead of once per candidate.
    baskets = [set(transaction.items) for transaction in transactions]
    for candidate in candidates:
        wanted = set(candidate.itemset)
        candidate.count = sum(1 for basket in baskets if wanted <= basket)

def prune_candidates(candidates, min_support):
    """Return the candidates whose support count reaches ``min_support``.

    Args:
        candidates: Iterable of objects with a ``count`` attribute.
        min_support: Minimum count (inclusive) a candidate needs to be kept.

    Returns:
        A new list with the surviving candidates in their original order.
    """
    return [candidate for candidate in candidates if candidate.count >= min_support]

def apriori(transactions, min_support):
    """Print every frequent itemset, level by level, with its support count.

    Starting from single items, each round counts the support of the current
    candidates, drops those below ``min_support``, prints the survivors and
    joins them into candidates that are one item larger. The loop ends when
    no candidate is left.

    Args:
        transactions: Sequence of objects with an ``items`` attribute holding
            integer item ids.
        min_support: Minimum number of transactions an itemset must appear in.

    Returns:
        None. Results are written to standard output.
    """
    largest_item = max(
        (item for transaction in transactions for item in transaction.items),
        default=None,
    )
    if largest_item is None:
        # No items at all: nothing can be frequent, and max() on an empty
        # sequence would otherwise raise.
        return

    item_counts = count_items(transactions, largest_item)
    # NOTE(review): the range starts at 1, so an item with id 0 is never
    # considered -- confirm that ids are meant to be 1-based.
    candidates = [
        Itemset([item])
        for item in range(1, len(item_counts))
        if item_counts[item] >= min_support
    ]

    # Size of the itemsets currently held in `candidates`. The heading used to
    # print the size of the *next* generation, labelling single items "size 2".
    size = 1
    while candidates:
        calculate_support(candidates, transactions)
        candidates = prune_candidates(candidates, min_support)
        if candidates:
            print(f"\nFrequent Itemsets of size {size}:")
            for candidate in candidates:
                print(f"{' '.join(map(str, candidate.itemset))} - Support: {candidate.count}")
        size += 1
        candidates = generate_candidates(candidates, size)

# Run the interactive Apriori session only when executed as a script, so that
# importing this code does not block on input().
if __name__ == "__main__":
    transactions = get_user_input()
    min_support = int(input("Enter the minimum support (e.g., 2): "))
    apriori(transactions, min_support)

OUTPUT:-------
Enter the number of transactions: 5
Enter items (comma-separated): 1,2
Enter items (comma-separated): 1
Enter items (comma-separated): 2
Enter items (comma-separated): 1,2,3
Enter items (comma-separated): 2,3
Enter the minimum support (e.g., 2): 2

Frequent Itemsets of size 2:
1 - Support: 3
2 - Support: 4
3 - Support: 2

Frequent Itemsets of size 3:
1 2 - Support: 2
2 3 - Support: 2

AGGLOMERATIVE hierarchical clustering--------------------------------------------------

import numpy as np
import matplotlib.pyplot as plt
import pandas as pd
from scipy.cluster.hierarchy import linkage, dendrogram as dendogram

def get_user_input():
    """Read a set of 2-D points from standard input.

    The user enters the number of points and then one point per line as two
    numbers separated by whitespace or a comma. An invalid line is reported
    and the same point is asked for again.

    Returns:
        A NumPy array with one ``[x, y]`` row per point.

    Raises:
        ValueError: If the number of points is not an integer.
    """
    n = int(input("Enter the number of points in the dataset: "))
    X = []
    print("Enter the co-ordinates (x,y) for each point: ")
    for i in range(n):
        while True:
            try:
                # The prompt advertises "(x,y)", so accept a comma as well as
                # whitespace between the two values.
                coords = input(f"Point {i+1}: ").replace(",", " ").split()
                if len(coords) != 2:
                    raise ValueError("expected exactly two values separated by a space")
                x, y = map(float, coords)
            except ValueError as e:
                print(f"Invalid input: {e}. Please try again")
            else:
                X.append([x, y])
                break
    return np.array(X)

def hierarchical_clustering_with_dendogram(X, method='single'):
    """Cluster the points agglomeratively, plot the dendrogram and print the merges.

    Args:
        X: Sequence of points, one row per point.
        method: Linkage criterion passed to ``scipy.cluster.hierarchy.linkage``
            (the callers in this listing use 'single', 'complete' and 'average').

    Returns:
        None. A dendrogram window is shown and the merge table is printed.
    """
    Z = linkage(X, method=method)

    plt.figure(figsize=(8, 5))
    dendogram(Z, labels=[f"Point {i+1}" for i in range(len(X))])
    plt.title(f'Dendrogram ({method.capitalize()} Linkage)')
    plt.xlabel('Point')
    plt.ylabel('Distance')
    plt.show()

    # Each row of Z describes one merge: the two cluster ids, the distance
    # between them and the number of points in the merged cluster.
    table = pd.DataFrame(Z, columns=["Cluster 1", "Cluster 2", "Distance", "New Cluster Size"])
    # Shift the 0-based ids to 1-based so they line up with the "Point i"
    # labels; ids above len(X) then refer to clusters created by earlier rows.
    for column in ("Cluster 1", "Cluster 2"):
        table[column] = table[column].astype(int) + 1
    # The size is a whole number of points; show it as 2 rather than 2.0.
    table["New Cluster Size"] = table["New Cluster Size"].astype(int)

    print(f"\n{method.capitalize()} Linkage Clustering Merges in Tabular Format")
    print(table)

# Run the interactive clustering session only when executed as a script, so
# that importing this code does not block on input() or open plot windows.
if __name__ == "__main__":
    X = get_user_input()
    # Same report for each linkage criterion, in the original order.
    for method in ("single", "complete", "average"):
        print(f"{method.capitalize()} Linkage Clustering:")
        hierarchical_clustering_with_dendogram(X, method=method)

Output------------
Enter the number of points in the dataset: 6
Enter the co-ordinates (x,y) for each point:
Point 1: 0.4 0.53
Point 2: 0.22 0.38
Point 3: 0.35 0.32
Point 4: 0.26 0.19
Point 5: 0.08 0.41
Point 6: 0.45 0.30

Single Linkage Clustering:

Single Linkage Clustering Merges in Tabular Format
Cluster 1 Cluster 2 Distance New Cluster Size
3 5 0.101980 2.0
2 7 0.143178 3.0
6 8 0.143178 4.0
4 9 0.158114 5.0
1 10 0.215870 6.0

Complete Linkage Clustering:

Complete Linkage Clustering Merges in Tabular Format
Cluster 1 Cluster 2 Distance New Cluster Size
3 5 0.101980 2.0
2 6 0.143178 2.0
4 7 0.219545 3.0
1 8 0.341760 3.0
9 10 0.386005 6.0

Average Linkage Clustering:

Average Linkage Clustering Merges in Tabular Format
Cluster 1 Cluster 2 Distance New Cluster Size
3 5 0.101980 2.0
2 6 0.143178 2.0
4 7 0.188829 3.0
8 9 0.255954 5.0
1 10 0.279001 6.0
KMEAN ALGO-----------------------------------------------------------------------------------
from sklearn.cluster import KMeans
import numpy as np

# Get user input for data points

def get_user_data():
    """Read one-dimensional data points from standard input.

    The user enters the number of points and then one numeric value per
    point. A value that is not a number is reported and asked for again.

    Returns:
        A NumPy array with one single-element row ``[value]`` per point.

    Raises:
        ValueError: If the number of points is not an integer.
    """
    n = int(input("Enter the number of points: "))
    data = []
    for i in range(n):
        while True:
            try:
                value = float(input(f"Enter value for point {i+1}: "))
            except ValueError:
                # Re-ask for this point instead of discarding everything
                # entered so far.
                print("Invalid input: expected a number. Please try again")
            else:
                data.append([value])
                break
    return np.array(data)

data = get_user_data()

# Create and fit the KMeans model.
# n_init is pinned because its default differs between scikit-learn releases
# (10 restarts in older versions, 'auto' in newer ones); stating it keeps the
# clustering identical across versions and avoids the default-change warning.

kmeans = KMeans(n_clusters=2, n_init=10, random_state=0).fit(data)

# Retrieve the clusters and print the results: rows are split by the label
# KMeans assigned to them (0 or 1).

cluster_1 = data[kmeans.labels_ == 0]
cluster_2 = data[kmeans.labels_ == 1]

print("Cluster 1:", *cluster_1.flatten())

print("Cluster 2:", *cluster_2.flatten())

OUTPUT : -------------
Enter the number of points: 9
Enter value for point 1: 2
Enter value for point 2: 4
Enter value for point 3: 10
Enter value for point 4: 12
Enter value for point 5: 3
Enter value for point 6: 20
Enter value for point 7: 30
Enter value for point 8: 11
Enter value for point 9: 25
Cluster 1: 2.0 4.0 10.0 12.0 3.0 11.0
Cluster 2: 20.0 30.0 25.0

Page Rank
No ratings yet
Page Rank
7 pages
Prac7 8 9 10
No ratings yet
Prac7 8 9 10
12 pages
S6 - Data Mining Lab Experiments (Except 1)
No ratings yet
S6 - Data Mining Lab Experiments (Except 1)
6 pages
Data Mining Ex1
No ratings yet
Data Mining Ex1
10 pages
DWM Practical
No ratings yet
DWM Practical
12 pages
Practical 5
No ratings yet
Practical 5
6 pages
23CC554
No ratings yet
23CC554
10 pages
Code:: To Find Frequent Itemsets and Association Between Different Itemsets Using Apriori Algorithm
No ratings yet
Code:: To Find Frequent Itemsets and Association Between Different Itemsets Using Apriori Algorithm
28 pages
BDA Experiments
No ratings yet
BDA Experiments
41 pages
DM Lab Internal
No ratings yet
DM Lab Internal
37 pages
DWDM Lab Report
No ratings yet
DWDM Lab Report
10 pages
7 Output
No ratings yet
7 Output
4 pages
Mlda - Lab
No ratings yet
Mlda - Lab
35 pages
Data Warehousing and Data Mining
No ratings yet
Data Warehousing and Data Mining
24 pages
SOLUTION ONLY CODE DWDM - Lab - All
No ratings yet
SOLUTION ONLY CODE DWDM - Lab - All
8 pages
AIML Lab 10
No ratings yet
AIML Lab 10
4 pages
Implement Clustering Algorithms For Unsupervised Classification
No ratings yet
Implement Clustering Algorithms For Unsupervised Classification
4 pages
Wa0003
No ratings yet
Wa0003
16 pages
CMSDWM Exp 7
No ratings yet
CMSDWM Exp 7
13 pages
Assg 3
No ratings yet
Assg 3
31 pages
DWM
No ratings yet
DWM
12 pages
Aiml Assignment 10
No ratings yet
Aiml Assignment 10
6 pages
Tanu Raman ML Lab File
No ratings yet
Tanu Raman ML Lab File
21 pages
ML Shristi File
No ratings yet
ML Shristi File
49 pages
DWDM Lab All
No ratings yet
DWDM Lab All
20 pages
MLFILE
No ratings yet
MLFILE
21 pages
Data Mining Assignment No. 1
No ratings yet
Data Mining Assignment No. 1
22 pages
Python Basics for Data Science
No ratings yet
Python Basics for Data Science
30 pages
BIG DATA - Assign
No ratings yet
BIG DATA - Assign
28 pages
DMT Cia2
No ratings yet
DMT Cia2
11 pages
Data Mining - Project
100% (2)
Data Mining - Project
11 pages
Clustering
No ratings yet
Clustering
1 page
Data Mining Lab Manual
No ratings yet
Data Mining Lab Manual
7 pages
Apriori Algorithm & Clustering Guide
No ratings yet
Apriori Algorithm & Clustering Guide
8 pages
Data Analysis for Beginners
No ratings yet
Data Analysis for Beginners
1 page
PRGM 4
No ratings yet
PRGM 4
3 pages
ML Assignment
No ratings yet
ML Assignment
11 pages
ML Exp5 C36
No ratings yet
ML Exp5 C36
18 pages
DMDW Fielding Set
No ratings yet
DMDW Fielding Set
11 pages
Machine Learning Algorithms Guide
No ratings yet
Machine Learning Algorithms Guide
34 pages
1.1 Read The Data and Do Exploratory Data Analysis. Describe The Data Briefly
100% (19)
1.1 Read The Data and Do Exploratory Data Analysis. Describe The Data Briefly
50 pages
Prac9 23bme053
No ratings yet
Prac9 23bme053
4 pages
MLLab Manual
No ratings yet
MLLab Manual
24 pages
DSC Lab Programs
No ratings yet
DSC Lab Programs
24 pages
Project Data Mining (AMAN YADAV)
No ratings yet
Project Data Mining (AMAN YADAV)
12 pages
AI Lab Codes.
No ratings yet
AI Lab Codes.
12 pages
Week 6 (PCA, SVD, LDA)
No ratings yet
Week 6 (PCA, SVD, LDA)
14 pages
Aiml Lab
No ratings yet
Aiml Lab
37 pages
ML Programs
No ratings yet
ML Programs
14 pages
Program
No ratings yet
Program
2 pages
Data Clustering for Analysts
No ratings yet
Data Clustering for Analysts
8 pages
DWDM Lab Report
No ratings yet
DWDM Lab Report
12 pages
DWDM Lab Report
No ratings yet
DWDM Lab Report
26 pages
Merged
No ratings yet
Merged
35 pages
Week 8 DS Practical
No ratings yet
Week 8 DS Practical
13 pages
Chapter-2 1.: #Print (Train - Data)
No ratings yet
Chapter-2 1.: #Print (Train - Data)
9 pages
Data - Analytics Lab - Manual JNTUH R22 Regulation
No ratings yet
Data - Analytics Lab - Manual JNTUH R22 Regulation
26 pages
Advanced Database
No ratings yet
Advanced Database
23 pages
Machine Learning Lab
No ratings yet
Machine Learning Lab
33 pages
02 - Linux Checklist
No ratings yet
02 - Linux Checklist
6 pages
(FREE PDF Sample) Introduction To Mathematical Proofs A Transition To Advanced Mathematics 2nd Edition Charles E. Roberts Ebooks
No ratings yet
(FREE PDF Sample) Introduction To Mathematical Proofs A Transition To Advanced Mathematics 2nd Edition Charles E. Roberts Ebooks
67 pages
Taller I Grado Noveno Fernando Ahumada
No ratings yet
Taller I Grado Noveno Fernando Ahumada
3 pages
Assertion and Reasoning Questions Class 6
No ratings yet
Assertion and Reasoning Questions Class 6
3 pages
Social Science Club Game: History or Tsismis
No ratings yet
Social Science Club Game: History or Tsismis
4 pages
Bladesinger
No ratings yet
Bladesinger
4 pages
All Result Last
No ratings yet
All Result Last
276 pages
Neelam
No ratings yet
Neelam
21 pages
Helen Keller FREE English Sketchnotes Worksheets-C
No ratings yet
Helen Keller FREE English Sketchnotes Worksheets-C
7 pages
Class Time Table 2025 - 26
No ratings yet
Class Time Table 2025 - 26
10 pages
CPP STL Containers
No ratings yet
CPP STL Containers
1 page
Revised Chapter 15 Post Covid BSTD Grade 12 Notes On Presentation and Data Response
No ratings yet
Revised Chapter 15 Post Covid BSTD Grade 12 Notes On Presentation and Data Response
8 pages
P-CAD 2004 New Features
No ratings yet
P-CAD 2004 New Features
23 pages
Linux DHCP Server Notes
No ratings yet
Linux DHCP Server Notes
3 pages
Proto Indo European - Language
No ratings yet
Proto Indo European - Language
20 pages
Khyber Pakhtunkhwa Insights
No ratings yet
Khyber Pakhtunkhwa Insights
17 pages
Inspiring People #1
No ratings yet
Inspiring People #1
4 pages
Software Quality Engineering - Unit 3
No ratings yet
Software Quality Engineering - Unit 3
44 pages
Plan Lectie A 4a
No ratings yet
Plan Lectie A 4a
3 pages
GR 11 Geo Research Task Loadshedding 2025 (1) - Edited
100% (3)
GR 11 Geo Research Task Loadshedding 2025 (1) - Edited
16 pages
Modern Systems Analysis and Design - Design - Part 2
No ratings yet
Modern Systems Analysis and Design - Design - Part 2
53 pages
Great Ideas of Mathematics
No ratings yet
Great Ideas of Mathematics
2 pages
C Program for LL(1) Parsing Table
No ratings yet
C Program for LL(1) Parsing Table
25 pages
Legal Implications of All-Caps Names
No ratings yet
Legal Implications of All-Caps Names
23 pages
PPJOY Instructions
No ratings yet
PPJOY Instructions
2 pages
MC - Final Student List (HSC Form Fillup-2025) 19.3.25
No ratings yet
MC - Final Student List (HSC Form Fillup-2025) 19.3.25
200 pages
Kerala SSLC English Grammar Extended Activities Based On 16.10.2020 Class
No ratings yet
Kerala SSLC English Grammar Extended Activities Based On 16.10.2020 Class
13 pages
The Planners
No ratings yet
The Planners
10 pages
Ulysses - TEST
0% (1)
Ulysses - TEST
2 pages
Roles and Responsibilities of The MD and RSC Mission
No ratings yet
Roles and Responsibilities of The MD and RSC Mission
10 pages

D3 Docs

Uploaded by

D3 Docs

Uploaded by

-- Create the books table

CREATE TABLE books (

-- Insert data into the books table

-- SLICE operation: count the books with '1 EDITION'

-- DICE operation: select books with the title 'pik'

-- DRILL-DOWN operation: select all books with the author 'JOHN'

def page_rank(n, links, d=0.85, max_iter=100, tol=1e-6):

output: Enter the number of pages: 3 PageRank Values:

X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.3, random_state=42)

accuracy = accuracy_score(y_test, y_pred)

def count_items(transactions, num_items):

def generate_candidates(prev_candidates, k):

def calculate_support(candidates, transactions):

def prune_candidates(candidates, min_support):

def apriori(transactions, min_support):

Frequent Itemsets of size 2:

AGGLOMERATIVE hierarchical clustering--------------------------------------------------

def hierarchical_clustering_with_dendogram(X, method='single'):

Single Linkage Clustering:

Complete Linkage Clustering:

Average Linkage Clustering:

# Get user input for data points

# Create and fit the KMeans model

# Retrieve the clusters and print the results

print("Cluster 1:", *cluster_1.flatten())

You might also like