This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
#Task - Convert a comma-separated row of names into column definitions and create a table
# Turn a comma-separated list of names into one nullable VARCHAR(100)
# column definition per name, ready to paste into a CREATE TABLE statement.
strdata = 'a,b,c,d,e,f,g,h,'
# strdata ends with a comma, so split(',') yields an empty last item;
# drop blank items so no nameless column definition is printed.
a = [name.strip() for name in strdata.split(',') if name.strip()]
# Join with ",\n" so every definition except the last ends in a comma and the
# printed text is a valid column list as-is.
print(',\n'.join(element + ' VARCHAR(100) NULL' for element in a))
#a VARCHAR(100) NULL,
#b VARCHAR(100) NULL,
#c VARCHAR(100) NULL,
#Build the T-SQL statement from the generated column definitions
-- Table with one nullable VARCHAR(100) column per generated name.
CREATE TABLE ATTRIBUTES
(
    a VARCHAR(100) NULL
  , b VARCHAR(100) NULL
  , c VARCHAR(100) NULL
);
#Task - One hot encoder (the steps below assign an integer id to each distinct city, i.e. label encoding)
#Step 1 - Load the data into a temp table
#Step 2 - Create a table to store the unique values
-- Lookup table that maps each distinct city name to a generated integer id.
CREATE TABLE cities
(
    cityid INT IDENTITY(1,1) NOT NULL,  -- generated id: starts at 1, increments by 1
    name   VARCHAR(50) NULL,
    CONSTRAINT cities_cityid_pk PRIMARY KEY (cityid),
    -- one row per name keeps the name -> cityid mapping unambiguous when joining on name
    CONSTRAINT cities_name_uq UNIQUE (name)
);
#Step 3 - Insert all unique city values into the cities table
-- Load each distinct city from the feature data into the lookup table;
-- cityid is generated by the identity column, so only name is supplied.
INSERT INTO cities (name)
SELECT DISTINCT
    fd.city
FROM decision_tree_featuredata AS fd
WHERE fd.city IS NOT NULL      -- a NULL name can never satisfy an equality join on name
  AND NOT EXISTS (             -- skip names already loaded so the step can be re-run safely
        SELECT 1
        FROM cities AS ct
        WHERE ct.name = fd.city
      );
#Step 4 - Add a new column to hold the label (city id) values
-- Add a nullable integer column to hold each row's numeric city label.
ALTER TABLE decision_tree_featuredata
    ADD city_id INT NULL;
#Step 5 - Update every row's city_id with the number assigned to its city
-- Fill city_id by matching each row's city text against the lookup table.
-- The target is decision_tree_featuredata: that is the table the city_id
-- column was added to and the table the city names were read from.
-- No WHERE clause on purpose: every row with a matching city is labelled.
UPDATE dt
SET dt.city_id = ct.cityid
FROM decision_tree_featuredata AS dt
INNER JOIN cities AS ct
    ON dt.city = ct.name;
Happy Learning!!!
No comments:
Post a Comment